1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  *	linux/arch/alpha/kernel/err_titan.c
4  *
5  *	Copyright (C) 2000 Jeff Wiedemeier (Compaq Computer Corporation)
6  *
7  *	Error handling code supporting TITAN systems
8  */
9 
10 #include <linux/init.h>
11 #include <linux/pci.h>
12 #include <linux/sched.h>
13 
14 #include <asm/io.h>
15 #include <asm/core_titan.h>
16 #include <asm/hwrpb.h>
17 #include <asm/smp.h>
18 #include <asm/err_common.h>
19 #include <asm/err_ev6.h>
20 #include <asm/irq_regs.h>
21 
22 #include "err_impl.h"
23 #include "proto.h"
24 
25 
26 static int
titan_parse_c_misc(u64 c_misc,int print)27 titan_parse_c_misc(u64 c_misc, int print)
28 {
29 #ifdef CONFIG_VERBOSE_MCHECK
30 	char *src;
31 	int nxs = 0;
32 #endif
33 	int status = MCHK_DISPOSITION_REPORT;
34 
35 #define TITAN__CCHIP_MISC__NXM		(1UL << 28)
36 #define TITAN__CCHIP_MISC__NXS__S	(29)
37 #define TITAN__CCHIP_MISC__NXS__M	(0x7)
38 
39 	if (!(c_misc & TITAN__CCHIP_MISC__NXM))
40 		return MCHK_DISPOSITION_UNKNOWN_ERROR;
41 
42 #ifdef CONFIG_VERBOSE_MCHECK
43 	if (!print)
44 		return status;
45 
46 	nxs = EXTRACT(c_misc, TITAN__CCHIP_MISC__NXS);
47 	switch(nxs) {
48 	case 0:	/* CPU 0 */
49 	case 1:	/* CPU 1 */
50 	case 2:	/* CPU 2 */
51 	case 3:	/* CPU 3 */
52 		src = "CPU";
53 		/* num is already the CPU number */
54 		break;
55 	case 4:	/* Pchip 0 */
56 	case 5:	/* Pchip 1 */
57 		src = "Pchip";
58 		nxs -= 4;
59 		break;
60 	default:/* reserved */
61 		src = "Unknown, NXS =";
62 		/* leave num untouched */
63 		break;
64 	}
65 
66 	printk("%s    Non-existent memory access from: %s %d\n",
67 	       err_print_prefix, src, nxs);
68 #endif /* CONFIG_VERBOSE_MCHECK */
69 
70 	return status;
71 }
72 
73 static int
titan_parse_p_serror(int which,u64 serror,int print)74 titan_parse_p_serror(int which, u64 serror, int print)
75 {
76 	int status = MCHK_DISPOSITION_REPORT;
77 
78 #ifdef CONFIG_VERBOSE_MCHECK
79 	static const char * const serror_src[] = {
80 		"GPCI", "APCI", "AGP HP", "AGP LP"
81 	};
82 	static const char * const serror_cmd[] = {
83 		"DMA Read", "DMA RMW", "SGTE Read", "Reserved"
84 	};
85 #endif /* CONFIG_VERBOSE_MCHECK */
86 
87 #define TITAN__PCHIP_SERROR__LOST_UECC	(1UL << 0)
88 #define TITAN__PCHIP_SERROR__UECC	(1UL << 1)
89 #define TITAN__PCHIP_SERROR__CRE	(1UL << 2)
90 #define TITAN__PCHIP_SERROR__NXIO	(1UL << 3)
91 #define TITAN__PCHIP_SERROR__LOST_CRE	(1UL << 4)
92 #define TITAN__PCHIP_SERROR__ECCMASK	(TITAN__PCHIP_SERROR__UECC |	  \
93 					 TITAN__PCHIP_SERROR__CRE)
94 #define TITAN__PCHIP_SERROR__ERRMASK	(TITAN__PCHIP_SERROR__LOST_UECC | \
95 					 TITAN__PCHIP_SERROR__UECC |	  \
96 					 TITAN__PCHIP_SERROR__CRE |	  \
97 					 TITAN__PCHIP_SERROR__NXIO |	  \
98 					 TITAN__PCHIP_SERROR__LOST_CRE)
99 #define TITAN__PCHIP_SERROR__SRC__S	(52)
100 #define TITAN__PCHIP_SERROR__SRC__M	(0x3)
101 #define TITAN__PCHIP_SERROR__CMD__S	(54)
102 #define TITAN__PCHIP_SERROR__CMD__M	(0x3)
103 #define TITAN__PCHIP_SERROR__SYN__S	(56)
104 #define TITAN__PCHIP_SERROR__SYN__M	(0xff)
105 #define TITAN__PCHIP_SERROR__ADDR__S	(15)
106 #define TITAN__PCHIP_SERROR__ADDR__M	(0xffffffffUL)
107 
108 	if (!(serror & TITAN__PCHIP_SERROR__ERRMASK))
109 		return MCHK_DISPOSITION_UNKNOWN_ERROR;
110 
111 #ifdef CONFIG_VERBOSE_MCHECK
112 	if (!print)
113 		return status;
114 
115 	printk("%s  PChip %d SERROR: %016llx\n",
116 	       err_print_prefix, which, serror);
117 	if (serror & TITAN__PCHIP_SERROR__ECCMASK) {
118 		printk("%s    %sorrectable ECC Error:\n"
119 		       "      Source: %-6s  Command: %-8s  Syndrome: 0x%08x\n"
120 		       "      Address: 0x%llx\n",
121 		       err_print_prefix,
122 		       (serror & TITAN__PCHIP_SERROR__UECC) ? "Unc" : "C",
123 		       serror_src[EXTRACT(serror, TITAN__PCHIP_SERROR__SRC)],
124 		       serror_cmd[EXTRACT(serror, TITAN__PCHIP_SERROR__CMD)],
125 		       (unsigned)EXTRACT(serror, TITAN__PCHIP_SERROR__SYN),
126 		       EXTRACT(serror, TITAN__PCHIP_SERROR__ADDR));
127 	}
128 	if (serror & TITAN__PCHIP_SERROR__NXIO)
129 		printk("%s    Non Existent I/O Error\n", err_print_prefix);
130 	if (serror & TITAN__PCHIP_SERROR__LOST_UECC)
131 		printk("%s    Lost Uncorrectable ECC Error\n",
132 		       err_print_prefix);
133 	if (serror & TITAN__PCHIP_SERROR__LOST_CRE)
134 		printk("%s    Lost Correctable ECC Error\n", err_print_prefix);
135 #endif /* CONFIG_VERBOSE_MCHECK */
136 
137 	return status;
138 }
139 
140 static int
titan_parse_p_perror(int which,int port,u64 perror,int print)141 titan_parse_p_perror(int which, int port, u64 perror, int print)
142 {
143 	int cmd;
144 	unsigned long addr;
145 	int status = MCHK_DISPOSITION_REPORT;
146 
147 #ifdef CONFIG_VERBOSE_MCHECK
148 	static const char * const perror_cmd[] = {
149 		"Interrupt Acknowledge", "Special Cycle",
150 		"I/O Read",		"I/O Write",
151 		"Reserved",		"Reserved",
152 		"Memory Read",		"Memory Write",
153 		"Reserved",		"Reserved",
154 		"Configuration Read",	"Configuration Write",
155 		"Memory Read Multiple",	"Dual Address Cycle",
156 		"Memory Read Line",	"Memory Write and Invalidate"
157 	};
158 #endif /* CONFIG_VERBOSE_MCHECK */
159 
160 #define TITAN__PCHIP_PERROR__LOST	(1UL << 0)
161 #define TITAN__PCHIP_PERROR__SERR	(1UL << 1)
162 #define TITAN__PCHIP_PERROR__PERR	(1UL << 2)
163 #define TITAN__PCHIP_PERROR__DCRTO	(1UL << 3)
164 #define TITAN__PCHIP_PERROR__SGE	(1UL << 4)
165 #define TITAN__PCHIP_PERROR__APE	(1UL << 5)
166 #define TITAN__PCHIP_PERROR__TA		(1UL << 6)
167 #define TITAN__PCHIP_PERROR__DPE	(1UL << 7)
168 #define TITAN__PCHIP_PERROR__NDS	(1UL << 8)
169 #define TITAN__PCHIP_PERROR__IPTPR	(1UL << 9)
170 #define TITAN__PCHIP_PERROR__IPTPW	(1UL << 10)
171 #define TITAN__PCHIP_PERROR__ERRMASK	(TITAN__PCHIP_PERROR__LOST |	\
172 					 TITAN__PCHIP_PERROR__SERR |	\
173 					 TITAN__PCHIP_PERROR__PERR |	\
174 					 TITAN__PCHIP_PERROR__DCRTO |	\
175 					 TITAN__PCHIP_PERROR__SGE |	\
176 					 TITAN__PCHIP_PERROR__APE |	\
177 					 TITAN__PCHIP_PERROR__TA |	\
178 					 TITAN__PCHIP_PERROR__DPE |	\
179 					 TITAN__PCHIP_PERROR__NDS |	\
180 					 TITAN__PCHIP_PERROR__IPTPR |	\
181 					 TITAN__PCHIP_PERROR__IPTPW)
182 #define TITAN__PCHIP_PERROR__DAC	(1UL << 47)
183 #define TITAN__PCHIP_PERROR__MWIN	(1UL << 48)
184 #define TITAN__PCHIP_PERROR__CMD__S	(52)
185 #define TITAN__PCHIP_PERROR__CMD__M	(0x0f)
186 #define TITAN__PCHIP_PERROR__ADDR__S	(14)
187 #define TITAN__PCHIP_PERROR__ADDR__M	(0x1fffffffful)
188 
189 	if (!(perror & TITAN__PCHIP_PERROR__ERRMASK))
190 		return MCHK_DISPOSITION_UNKNOWN_ERROR;
191 
192 	cmd = EXTRACT(perror, TITAN__PCHIP_PERROR__CMD);
193 	addr = EXTRACT(perror, TITAN__PCHIP_PERROR__ADDR) << 2;
194 
195 	/*
196 	 * Initializing the BIOS on a video card on a bus without
197 	 * a south bridge (subtractive decode agent) can result in
198 	 * master aborts as the BIOS probes the capabilities of the
199 	 * card. XFree86 does such initialization. If the error
200 	 * is a master abort (No DevSel as PCI Master) and the command
201 	 * is an I/O read or write below the address where we start
202 	 * assigning PCI I/O spaces (SRM uses 0x1000), then mark the
203 	 * error as dismissable so starting XFree86 doesn't result
204 	 * in a series of uncorrectable errors being reported. Also
205 	 * dismiss master aborts to VGA frame buffer space
206 	 * (0xA0000 - 0xC0000) and legacy BIOS space (0xC0000 - 0x100000)
207 	 * for the same reason.
208 	 *
209 	 * Also mark the error dismissible if it looks like the right
210 	 * error but only the Lost bit is set. Since the BIOS initialization
211 	 * can cause multiple master aborts and the error interrupt can
212 	 * be handled on a different CPU than the BIOS code is run on,
213 	 * it is possible for a second master abort to occur between the
214 	 * time the PALcode reads PERROR and the time it writes PERROR
215 	 * to acknowledge the error. If this timing happens, a second
216 	 * error will be signalled after the first, and if no additional
217 	 * errors occur, will look like a Lost error with no additional
218 	 * errors on the same transaction as the previous error.
219 	 */
220 	if (((perror & TITAN__PCHIP_PERROR__NDS) ||
221 	     ((perror & TITAN__PCHIP_PERROR__ERRMASK) ==
222 	      TITAN__PCHIP_PERROR__LOST)) &&
223 	    ((((cmd & 0xE) == 2) && (addr < 0x1000)) ||
224 	     (((cmd & 0xE) == 6) && (addr >= 0xA0000) && (addr < 0x100000)))) {
225 		status = MCHK_DISPOSITION_DISMISS;
226 	}
227 
228 #ifdef CONFIG_VERBOSE_MCHECK
229 	if (!print)
230 		return status;
231 
232 	printk("%s  PChip %d %cPERROR: %016llx\n",
233 	       err_print_prefix, which,
234 	       port ? 'A' : 'G', perror);
235 	if (perror & TITAN__PCHIP_PERROR__IPTPW)
236 		printk("%s    Invalid Peer-to-Peer Write\n", err_print_prefix);
237 	if (perror & TITAN__PCHIP_PERROR__IPTPR)
238 		printk("%s    Invalid Peer-to-Peer Read\n", err_print_prefix);
239 	if (perror & TITAN__PCHIP_PERROR__NDS)
240 		printk("%s    No DEVSEL as PCI Master [Master Abort]\n",
241 		       err_print_prefix);
242 	if (perror & TITAN__PCHIP_PERROR__DPE)
243 		printk("%s    Data Parity Error\n", err_print_prefix);
244 	if (perror & TITAN__PCHIP_PERROR__TA)
245 		printk("%s    Target Abort\n", err_print_prefix);
246 	if (perror & TITAN__PCHIP_PERROR__APE)
247 		printk("%s    Address Parity Error\n", err_print_prefix);
248 	if (perror & TITAN__PCHIP_PERROR__SGE)
249 		printk("%s    Scatter-Gather Error, Invalid PTE\n",
250 		       err_print_prefix);
251 	if (perror & TITAN__PCHIP_PERROR__DCRTO)
252 		printk("%s    Delayed-Completion Retry Timeout\n",
253 		       err_print_prefix);
254 	if (perror & TITAN__PCHIP_PERROR__PERR)
255 		printk("%s    PERR Asserted\n", err_print_prefix);
256 	if (perror & TITAN__PCHIP_PERROR__SERR)
257 		printk("%s    SERR Asserted\n", err_print_prefix);
258 	if (perror & TITAN__PCHIP_PERROR__LOST)
259 		printk("%s    Lost Error\n", err_print_prefix);
260 	printk("%s      Command: 0x%x - %s\n"
261 		 "      Address: 0x%lx\n",
262 	       err_print_prefix,
263 	       cmd, perror_cmd[cmd],
264 	       addr);
265 	if (perror & TITAN__PCHIP_PERROR__DAC)
266 		printk("%s      Dual Address Cycle\n", err_print_prefix);
267 	if (perror & TITAN__PCHIP_PERROR__MWIN)
268 		printk("%s      Hit in Monster Window\n", err_print_prefix);
269 #endif /* CONFIG_VERBOSE_MCHECK */
270 
271 	return status;
272 }
273 
274 static int
titan_parse_p_agperror(int which,u64 agperror,int print)275 titan_parse_p_agperror(int which, u64 agperror, int print)
276 {
277 	int status = MCHK_DISPOSITION_REPORT;
278 #ifdef CONFIG_VERBOSE_MCHECK
279 	int cmd, len;
280 	unsigned long addr;
281 
282 	static const char * const agperror_cmd[] = {
283 		"Read (low-priority)",	"Read (high-priority)",
284 		"Write (low-priority)",	"Write (high-priority)",
285 		"Reserved",		"Reserved",
286 		"Flush",		"Fence"
287 	};
288 #endif /* CONFIG_VERBOSE_MCHECK */
289 
290 #define TITAN__PCHIP_AGPERROR__LOST	(1UL << 0)
291 #define TITAN__PCHIP_AGPERROR__LPQFULL	(1UL << 1)
292 #define TITAN__PCHIP_AGPERROR__HPQFULL	(1UL << 2)
293 #define TITAN__PCHIP_AGPERROR__RESCMD	(1UL << 3)
294 #define TITAN__PCHIP_AGPERROR__IPTE	(1UL << 4)
295 #define TITAN__PCHIP_AGPERROR__PTP	(1UL << 5)
296 #define TITAN__PCHIP_AGPERROR__NOWINDOW	(1UL << 6)
297 #define TITAN__PCHIP_AGPERROR__ERRMASK	(TITAN__PCHIP_AGPERROR__LOST |    \
298 					 TITAN__PCHIP_AGPERROR__LPQFULL | \
299 					 TITAN__PCHIP_AGPERROR__HPQFULL | \
300 					 TITAN__PCHIP_AGPERROR__RESCMD |  \
301 					 TITAN__PCHIP_AGPERROR__IPTE |    \
302 					 TITAN__PCHIP_AGPERROR__PTP |     \
303 					 TITAN__PCHIP_AGPERROR__NOWINDOW)
304 #define TITAN__PCHIP_AGPERROR__DAC	(1UL << 48)
305 #define TITAN__PCHIP_AGPERROR__MWIN	(1UL << 49)
306 #define TITAN__PCHIP_AGPERROR__FENCE	(1UL << 59)
307 #define TITAN__PCHIP_AGPERROR__CMD__S	(50)
308 #define TITAN__PCHIP_AGPERROR__CMD__M	(0x07)
309 #define TITAN__PCHIP_AGPERROR__ADDR__S	(15)
310 #define TITAN__PCHIP_AGPERROR__ADDR__M  (0xffffffffUL)
311 #define TITAN__PCHIP_AGPERROR__LEN__S	(53)
312 #define TITAN__PCHIP_AGPERROR__LEN__M	(0x3f)
313 
314 	if (!(agperror & TITAN__PCHIP_AGPERROR__ERRMASK))
315 		return MCHK_DISPOSITION_UNKNOWN_ERROR;
316 
317 #ifdef CONFIG_VERBOSE_MCHECK
318 	if (!print)
319 		return status;
320 
321 	cmd = EXTRACT(agperror, TITAN__PCHIP_AGPERROR__CMD);
322 	addr = EXTRACT(agperror, TITAN__PCHIP_AGPERROR__ADDR) << 3;
323 	len = EXTRACT(agperror, TITAN__PCHIP_AGPERROR__LEN);
324 
325 	printk("%s  PChip %d AGPERROR: %016llx\n", err_print_prefix,
326 	       which, agperror);
327 	if (agperror & TITAN__PCHIP_AGPERROR__NOWINDOW)
328 		printk("%s    No Window\n", err_print_prefix);
329 	if (agperror & TITAN__PCHIP_AGPERROR__PTP)
330 		printk("%s    Peer-to-Peer set\n", err_print_prefix);
331 	if (agperror & TITAN__PCHIP_AGPERROR__IPTE)
332 		printk("%s    Invalid PTE\n", err_print_prefix);
333 	if (agperror & TITAN__PCHIP_AGPERROR__RESCMD)
334 		printk("%s    Reserved Command\n", err_print_prefix);
335 	if (agperror & TITAN__PCHIP_AGPERROR__HPQFULL)
336 		printk("%s    HP Transaction Received while Queue Full\n",
337 		       err_print_prefix);
338 	if (agperror & TITAN__PCHIP_AGPERROR__LPQFULL)
339 		printk("%s    LP Transaction Received while Queue Full\n",
340 		       err_print_prefix);
341 	if (agperror & TITAN__PCHIP_AGPERROR__LOST)
342 		printk("%s    Lost Error\n", err_print_prefix);
343 	printk("%s      Command: 0x%x - %s, %d Quadwords%s\n"
344 		 "      Address: 0x%lx\n",
345 	       err_print_prefix, cmd, agperror_cmd[cmd], len,
346 	       (agperror & TITAN__PCHIP_AGPERROR__FENCE) ? ", FENCE" : "",
347 	       addr);
348 	if (agperror & TITAN__PCHIP_AGPERROR__DAC)
349 		printk("%s      Dual Address Cycle\n", err_print_prefix);
350 	if (agperror & TITAN__PCHIP_AGPERROR__MWIN)
351 		printk("%s      Hit in Monster Window\n", err_print_prefix);
352 #endif /* CONFIG_VERBOSE_MCHECK */
353 
354 	return status;
355 }
356 
357 static int
titan_parse_p_chip(int which,u64 serror,u64 gperror,u64 aperror,u64 agperror,int print)358 titan_parse_p_chip(int which, u64 serror, u64 gperror,
359 		   u64 aperror, u64 agperror, int print)
360 {
361 	int status = MCHK_DISPOSITION_UNKNOWN_ERROR;
362 	status |= titan_parse_p_serror(which, serror, print);
363 	status |= titan_parse_p_perror(which, 0, gperror, print);
364 	status |= titan_parse_p_perror(which, 1, aperror, print);
365 	status |= titan_parse_p_agperror(which, agperror, print);
366 	return status;
367 }
368 
369 int
titan_process_logout_frame(struct el_common * mchk_header,int print)370 titan_process_logout_frame(struct el_common *mchk_header, int print)
371 {
372 	struct el_TITAN_sysdata_mcheck *tmchk =
373 		(struct el_TITAN_sysdata_mcheck *)
374 		((unsigned long)mchk_header + mchk_header->sys_offset);
375 	int status = MCHK_DISPOSITION_UNKNOWN_ERROR;
376 
377 	status |= titan_parse_c_misc(tmchk->c_misc, print);
378 	status |= titan_parse_p_chip(0, tmchk->p0_serror, tmchk->p0_gperror,
379 				     tmchk->p0_aperror, tmchk->p0_agperror,
380 				     print);
381 	status |= titan_parse_p_chip(1, tmchk->p1_serror, tmchk->p1_gperror,
382 				     tmchk->p1_aperror, tmchk->p1_agperror,
383 				     print);
384 
385 	return status;
386 }
387 
388 void
titan_machine_check(unsigned long vector,unsigned long la_ptr)389 titan_machine_check(unsigned long vector, unsigned long la_ptr)
390 {
391 	struct el_common *mchk_header = (struct el_common *)la_ptr;
392 	struct el_TITAN_sysdata_mcheck *tmchk =
393 		(struct el_TITAN_sysdata_mcheck *)
394 		((unsigned long)mchk_header + mchk_header->sys_offset);
395 	u64 irqmask;
396 
397 	/*
398 	 * Mask of Titan interrupt sources which are reported as machine checks
399 	 *
400 	 * 63 - CChip Error
401 	 * 62 - PChip 0 H_Error
402 	 * 61 - PChip 1 H_Error
403 	 * 60 - PChip 0 C_Error
404 	 * 59 - PChip 1 C_Error
405 	 */
406 #define TITAN_MCHECK_INTERRUPT_MASK	0xF800000000000000UL
407 
408 	/*
409 	 * Sync the processor
410 	 */
411 	mb();
412 	draina();
413 
414 	/*
415 	 * Only handle system errors here
416 	 */
417 	if ((vector != SCB_Q_SYSMCHK) && (vector != SCB_Q_SYSERR)) {
418 		ev6_machine_check(vector, la_ptr);
419 		return;
420 	}
421 
422 	/*
423 	 * It's a system error, handle it here
424 	 *
425 	 * The PALcode has already cleared the error, so just parse it
426 	 */
427 
428 	/*
429 	 * Parse the logout frame without printing first. If the only error(s)
430 	 * found are classified as "dismissable", then just dismiss them and
431 	 * don't print any message
432 	 */
433 	if (titan_process_logout_frame(mchk_header, 0) !=
434 	    MCHK_DISPOSITION_DISMISS) {
435 		char *saved_err_prefix = err_print_prefix;
436 		err_print_prefix = KERN_CRIT;
437 
438 		/*
439 		 * Either a nondismissable error was detected or no
440 		 * recognized error was detected  in the logout frame
441 		 * -- report the error in either case
442 		 */
443 		printk("%s"
444 		       "*System %s Error (Vector 0x%x) reported on CPU %d:\n",
445 		       err_print_prefix,
446 		       (vector == SCB_Q_SYSERR)?"Correctable":"Uncorrectable",
447 		       (unsigned int)vector, (int)smp_processor_id());
448 
449 #ifdef CONFIG_VERBOSE_MCHECK
450 		titan_process_logout_frame(mchk_header, alpha_verbose_mcheck);
451 		if (alpha_verbose_mcheck)
452 			dik_show_regs(get_irq_regs(), NULL);
453 #endif /* CONFIG_VERBOSE_MCHECK */
454 
455 		err_print_prefix = saved_err_prefix;
456 
457 		/*
458 		 * Convert any pending interrupts which report as system
459 		 * machine checks to interrupts
460 		 */
461 		irqmask = tmchk->c_dirx & TITAN_MCHECK_INTERRUPT_MASK;
462 		titan_dispatch_irqs(irqmask);
463 	}
464 
465 
466 	/*
467 	 * Release the logout frame
468 	 */
469 	wrmces(0x7);
470 	mb();
471 }
472 
473 /*
474  * Subpacket Annotations
475  */
476 static char *el_titan_pchip0_extended_annotation[] = {
477 	"Subpacket Header", 	"P0_SCTL",	"P0_SERREN",
478 	"P0_APCTL",		"P0_APERREN",	"P0_AGPERREN",
479 	"P0_ASPRST",		"P0_AWSBA0",	"P0_AWSBA1",
480 	"P0_AWSBA2",		"P0_AWSBA3",	"P0_AWSM0",
481 	"P0_AWSM1",		"P0_AWSM2",	"P0_AWSM3",
482 	"P0_ATBA0",		"P0_ATBA1",	"P0_ATBA2",
483 	"P0_ATBA3",		"P0_GPCTL",	"P0_GPERREN",
484 	"P0_GSPRST",		"P0_GWSBA0",	"P0_GWSBA1",
485 	"P0_GWSBA2",		"P0_GWSBA3",	"P0_GWSM0",
486 	"P0_GWSM1",		"P0_GWSM2",	"P0_GWSM3",
487 	"P0_GTBA0",		"P0_GTBA1",	"P0_GTBA2",
488 	"P0_GTBA3",		NULL
489 };
490 static char *el_titan_pchip1_extended_annotation[] = {
491 	"Subpacket Header", 	"P1_SCTL",	"P1_SERREN",
492 	"P1_APCTL",		"P1_APERREN",	"P1_AGPERREN",
493 	"P1_ASPRST",		"P1_AWSBA0",	"P1_AWSBA1",
494 	"P1_AWSBA2",		"P1_AWSBA3",	"P1_AWSM0",
495 	"P1_AWSM1",		"P1_AWSM2",	"P1_AWSM3",
496 	"P1_ATBA0",		"P1_ATBA1",	"P1_ATBA2",
497 	"P1_ATBA3",		"P1_GPCTL",	"P1_GPERREN",
498 	"P1_GSPRST",		"P1_GWSBA0",	"P1_GWSBA1",
499 	"P1_GWSBA2",		"P1_GWSBA3",	"P1_GWSM0",
500 	"P1_GWSM1",		"P1_GWSM2",	"P1_GWSM3",
501 	"P1_GTBA0",		"P1_GTBA1",	"P1_GTBA2",
502 	"P1_GTBA3",		NULL
503 };
504 static char *el_titan_memory_extended_annotation[] = {
505 	"Subpacket Header", 	"AAR0",		"AAR1",
506 	"AAR2",			"AAR3",		"P0_SCTL",
507 	"P0_GPCTL",		"P0_APCTL",	"P1_SCTL",
508 	"P1_GPCTL",		"P1_SCTL",	NULL
509 };
510 
511 static struct el_subpacket_annotation el_titan_annotations[] = {
512 	SUBPACKET_ANNOTATION(EL_CLASS__REGATTA_FAMILY,
513 			     EL_TYPE__REGATTA__TITAN_PCHIP0_EXTENDED,
514 			     1,
515 			     "Titan PChip 0 Extended Frame",
516 			     el_titan_pchip0_extended_annotation),
517 	SUBPACKET_ANNOTATION(EL_CLASS__REGATTA_FAMILY,
518 			     EL_TYPE__REGATTA__TITAN_PCHIP1_EXTENDED,
519 			     1,
520 			     "Titan PChip 1 Extended Frame",
521 			     el_titan_pchip1_extended_annotation),
522 	SUBPACKET_ANNOTATION(EL_CLASS__REGATTA_FAMILY,
523 			     EL_TYPE__REGATTA__TITAN_MEMORY_EXTENDED,
524 			     1,
525 			     "Titan Memory Extended Frame",
526 			     el_titan_memory_extended_annotation),
527 	SUBPACKET_ANNOTATION(EL_CLASS__REGATTA_FAMILY,
528 			     EL_TYPE__TERMINATION__TERMINATION,
529 			     1,
530 			     "Termination Subpacket",
531 			     NULL)
532 };
533 
534 static struct el_subpacket *
el_process_regatta_subpacket(struct el_subpacket * header)535 el_process_regatta_subpacket(struct el_subpacket *header)
536 {
537 	if (header->class != EL_CLASS__REGATTA_FAMILY) {
538 		printk("%s  ** Unexpected header CLASS %d TYPE %d, aborting\n",
539 		       err_print_prefix,
540 		       header->class, header->type);
541 		return NULL;
542 	}
543 
544 	switch(header->type) {
545 	case EL_TYPE__REGATTA__PROCESSOR_ERROR_FRAME:
546 	case EL_TYPE__REGATTA__SYSTEM_ERROR_FRAME:
547 	case EL_TYPE__REGATTA__ENVIRONMENTAL_FRAME:
548 	case EL_TYPE__REGATTA__PROCESSOR_DBL_ERROR_HALT:
549 	case EL_TYPE__REGATTA__SYSTEM_DBL_ERROR_HALT:
550 		printk("%s  ** Occurred on CPU %d:\n",
551 		       err_print_prefix,
552 		       (int)header->by_type.regatta_frame.cpuid);
553 		privateer_process_logout_frame((struct el_common *)
554 			header->by_type.regatta_frame.data_start, 1);
555 		break;
556 	default:
557 		printk("%s  ** REGATTA TYPE %d SUBPACKET\n",
558 		       err_print_prefix, header->type);
559 		el_annotate_subpacket(header);
560 		break;
561 	}
562 
563 
564 	return (struct el_subpacket *)((unsigned long)header + header->length);
565 }
566 
567 static struct el_subpacket_handler titan_subpacket_handler =
568 	SUBPACKET_HANDLER_INIT(EL_CLASS__REGATTA_FAMILY,
569 			       el_process_regatta_subpacket);
570 
571 void __init
titan_register_error_handlers(void)572 titan_register_error_handlers(void)
573 {
574 	size_t i;
575 
576 	for (i = 0; i < ARRAY_SIZE (el_titan_annotations); i++)
577 		cdl_register_subpacket_annotation(&el_titan_annotations[i]);
578 
579 	cdl_register_subpacket_handler(&titan_subpacket_handler);
580 
581 	ev6_register_error_handlers();
582 }
583 
584 
585 /*
586  * Privateer
587  */
588 
589 static int
privateer_process_680_frame(struct el_common * mchk_header,int print)590 privateer_process_680_frame(struct el_common *mchk_header, int print)
591 {
592 	int status = MCHK_DISPOSITION_UNKNOWN_ERROR;
593 #ifdef CONFIG_VERBOSE_MCHECK
594 	struct el_PRIVATEER_envdata_mcheck *emchk =
595 		(struct el_PRIVATEER_envdata_mcheck *)
596 		((unsigned long)mchk_header + mchk_header->sys_offset);
597 
598 	/* TODO - categorize errors, for now, no error */
599 
600 	if (!print)
601 		return status;
602 
603 	/* TODO - decode instead of just dumping... */
604 	printk("%s  Summary Flags:         %016llx\n"
605  	         "  CChip DIRx:            %016llx\n"
606 		 "  System Management IR:  %016llx\n"
607 		 "  CPU IR:                %016llx\n"
608 		 "  Power Supply IR:       %016llx\n"
609 		 "  LM78 Fault Status:     %016llx\n"
610 		 "  System Doors:          %016llx\n"
611 		 "  Temperature Warning:   %016llx\n"
612 		 "  Fan Control:           %016llx\n"
613 		 "  Fatal Power Down Code: %016llx\n",
614 	       err_print_prefix,
615 	       emchk->summary,
616 	       emchk->c_dirx,
617 	       emchk->smir,
618 	       emchk->cpuir,
619 	       emchk->psir,
620 	       emchk->fault,
621 	       emchk->sys_doors,
622 	       emchk->temp_warn,
623 	       emchk->fan_ctrl,
624 	       emchk->code);
625 #endif /* CONFIG_VERBOSE_MCHECK */
626 
627 	return status;
628 }
629 
630 int
privateer_process_logout_frame(struct el_common * mchk_header,int print)631 privateer_process_logout_frame(struct el_common *mchk_header, int print)
632 {
633 	struct el_common_EV6_mcheck *ev6mchk =
634 		(struct el_common_EV6_mcheck *)mchk_header;
635 	int status = MCHK_DISPOSITION_UNKNOWN_ERROR;
636 
637 	/*
638 	 * Machine check codes
639 	 */
640 #define PRIVATEER_MCHK__CORR_ECC		0x86	/* 630 */
641 #define PRIVATEER_MCHK__DC_TAG_PERR		0x9E	/* 630 */
642 #define PRIVATEER_MCHK__PAL_BUGCHECK		0x8E	/* 670 */
643 #define PRIVATEER_MCHK__OS_BUGCHECK		0x90	/* 670 */
644 #define PRIVATEER_MCHK__PROC_HRD_ERR		0x98	/* 670 */
645 #define PRIVATEER_MCHK__ISTREAM_CMOV_PRX	0xA0	/* 670 */
646 #define PRIVATEER_MCHK__ISTREAM_CMOV_FLT	0xA2	/* 670 */
647 #define PRIVATEER_MCHK__SYS_HRD_ERR		0x202	/* 660 */
648 #define PRIVATEER_MCHK__SYS_CORR_ERR		0x204	/* 620 */
649 #define PRIVATEER_MCHK__SYS_ENVIRON		0x206	/* 680 */
650 
651 	switch(ev6mchk->MCHK_Code) {
652 	/*
653 	 * Vector 630 - Processor, Correctable
654 	 */
655 	case PRIVATEER_MCHK__CORR_ECC:
656 	case PRIVATEER_MCHK__DC_TAG_PERR:
657 		/*
658 		 * Fall through to vector 670 for processing...
659 		 */
660 	/*
661 	 * Vector 670 - Processor, Uncorrectable
662 	 */
663 	case PRIVATEER_MCHK__PAL_BUGCHECK:
664 	case PRIVATEER_MCHK__OS_BUGCHECK:
665 	case PRIVATEER_MCHK__PROC_HRD_ERR:
666 	case PRIVATEER_MCHK__ISTREAM_CMOV_PRX:
667 	case PRIVATEER_MCHK__ISTREAM_CMOV_FLT:
668 		status |= ev6_process_logout_frame(mchk_header, print);
669 		break;
670 
671 	/*
672 	 * Vector 620 - System, Correctable
673 	 */
674 	case PRIVATEER_MCHK__SYS_CORR_ERR:
675 		/*
676 		 * Fall through to vector 660 for processing...
677 		 */
678 	/*
679 	 * Vector 660 - System, Uncorrectable
680 	 */
681 	case PRIVATEER_MCHK__SYS_HRD_ERR:
682 		status |= titan_process_logout_frame(mchk_header, print);
683 		break;
684 
685 	/*
686 	 * Vector 680 - System, Environmental
687 	 */
688 	case PRIVATEER_MCHK__SYS_ENVIRON:	/* System, Environmental */
689 		status |= privateer_process_680_frame(mchk_header, print);
690 		break;
691 
692 	/*
693 	 * Unknown
694 	 */
695 	default:
696 		status |= MCHK_DISPOSITION_REPORT;
697 		if (print) {
698 			printk("%s** Unknown Error, frame follows\n",
699 			       err_print_prefix);
700 			mchk_dump_logout_frame(mchk_header);
701 		}
702 
703 	}
704 
705 	return status;
706 }
707 
708 void
privateer_machine_check(unsigned long vector,unsigned long la_ptr)709 privateer_machine_check(unsigned long vector, unsigned long la_ptr)
710 {
711 	struct el_common *mchk_header = (struct el_common *)la_ptr;
712 	struct el_TITAN_sysdata_mcheck *tmchk =
713 		(struct el_TITAN_sysdata_mcheck *)
714 		(la_ptr + mchk_header->sys_offset);
715 	u64 irqmask;
716 	char *saved_err_prefix = err_print_prefix;
717 
718 #define PRIVATEER_680_INTERRUPT_MASK		(0xE00UL)
719 #define PRIVATEER_HOTPLUG_INTERRUPT_MASK	(0xE00UL)
720 
721 	/*
722 	 * Sync the processor.
723 	 */
724 	mb();
725 	draina();
726 
727 	/*
728 	 * Only handle system events here.
729 	 */
730 	if (vector != SCB_Q_SYSEVENT)
731 		return titan_machine_check(vector, la_ptr);
732 
733 	/*
734 	 * Report the event - System Events should be reported even if no
735 	 * error is indicated since the event could indicate the return
736 	 * to normal status.
737 	 */
738 	err_print_prefix = KERN_CRIT;
739 	printk("%s*System Event (Vector 0x%x) reported on CPU %d:\n",
740 	       err_print_prefix,
741 	       (unsigned int)vector, (int)smp_processor_id());
742 	privateer_process_680_frame(mchk_header, 1);
743 	err_print_prefix = saved_err_prefix;
744 
745 	/*
746 	 * Convert any pending interrupts which report as 680 machine
747 	 * checks to interrupts.
748 	 */
749 	irqmask = tmchk->c_dirx & PRIVATEER_680_INTERRUPT_MASK;
750 
751 	/*
752 	 * Dispatch the interrupt(s).
753 	 */
754 	titan_dispatch_irqs(irqmask);
755 
756 	/*
757 	 * Release the logout frame.
758 	 */
759 	wrmces(0x7);
760 	mb();
761 }
762