My workstation just panicked, with panicstr: "Machine check - Hardware error".
I've checked the crash-data file and the uerf output, but I can't determine which
hardware component was at fault. When the machine crashed I was starting kvt (the KDE X terminal).
Can someone help me?
#
# Crash Data Collection (Version 1.4)
#
_crash_data_collection_time: Fri Oct 16 09:45:42 GMT 1998
_current_directory: /
_crash_kernel: /var/adm/crash/vmunix.0
_crash_core: /var/adm/crash/vmcore.0
_crash_arch: alpha
_crash_os: Digital UNIX
_host_version: Digital UNIX V4.0B (Rev. 564); Fri Jul 24 13:15:47 GMT 1998
_crash_version: Digital UNIX V4.0B (Rev. 564); Fri Jul 24 13:15:47 GMT 1998
[...]
_cpu: 33
_system_string: 0xffffffffff8005c8 = "DEC 3000 - M300LX"
_ncpus: 1
_avail_cpus: 1
_partial_dump: 1
_physmem(MBytes): 160
_panic_string: 0xfffffc00004f3d68 = "Machine check - Hardware error"
_paniccpu: 0
_panic_thread: 0xfffffc00075a4840
_preserved_message_buffer_begin:
struct {
msg_magic = 0x63061
msg_bufx = 0xc30
msg_bufr = 0x5f4
msg_bufc = "Alpha boot: available memory from 0x84a000 to 0xa000000
Digital UNIX V4.0B (Rev. 564); Fri Jul 24 13:15:47 GMT 1998
physical memory = 160.00 megabytes.
available memory = 151.76 megabytes.
using 606 buffers containing 4.73 megabytes of memory
tc0 at nexus
tcds0 at tc0 slot 4
scsi0 at tcds0 slot 0
rz3 at scsi0 target 3 lun 0 (LID=0) (DEC RZ26L (C) DEC 440C)
ln0: DEC LANCE Module Name: PMAD-BA
ln0 at tc0 slot 5
ln0: DEC LANCE Ethernet Interface, hardware address: 08-00-2B-3F-BB-3F
scc0 at tc0 slot 5
bba0 at tc0 slot 5
fb0 at tc0 slot 6
1280X1024
ln1: DEC LANCE Module Name: PMAD-AA
ln1 at tc0 slot 0
ln1: DEC LANCE Ethernet Interface, hardware address: 08-00-2B-9A-2F-43
DEC 3000 - M300LX system
Firmware revision: 6.9
PALcode: OSF version 1.45
dli: configured
Node ID is 08-00-2b-3f-bb-3f (from device ln0)
dna_netman: configured
Node UID is 1a2cde20-5c30-11d2-9f0f-08002b3fbb3f
dna_dli: configured
dna_base: configured
dna_xti: configured
SuperLAT. Copyright 1994 Meridian Technology Corp. All rights reserved.
ln1: lost carrier: check connector
ln1: lost carrier: check connector
ln1: lost carrier: check connector
ln1: lost carrier: check connector
ln1: lost carrier: check connector
ln1: lost carrier: check connector
ln1: lost carrier: check connector
ln1: lost carrier: check connector
ln1: lost carrier: check connector
NFS3 server guepard not responding still trying
NFS3 server guepard ok
NFS3 server guepard not responding still trying
NFS3 server guepard ok
NFS3 write error 28 on host guepard
MACHINE CHECK type 0x660 Machine check abort
ptr[0-1] = 0000000100000092 000003ffbff47e21
ptr[2-3] = 001182f800000004 3254325469325463
ptr[4-5] = 0000000000000000 000000000000ff00
ptr[6-7] = 000003ff80005c58 0000000000104000
ptr[8-9] = 0000000000000000 0000000000000008
ptr[10-11] = fffffc00003d7590 0000000000000000
ptr[12-13] = fffffc00003d7930 fffffc00003d7960
ptr[14-15] = fffffc00003d79c0 fffffc00003d7730
ptr[16-17] = fffffc00003d7400 0000000000000000
ptr[18-19] = 000000011fffda90 ffffffff8b13ba38
ptr[20-21] = fffffc000050e340 0000000000000000
ptr[22-23] = 6068686c7c7c7c7c 000000690000087e
ptr[24-25] = 0000000000000000 0000000000010000
ptr[26-27] = 000000000de42002 0000000000000000
ptr[28-29] = 0000000005518000 fffffffc00000000
ptr[30-31] = 0000000000000001 0000000003ea3a38
exc_addr = 000003ff80005bae
exc_sum = 0000000000000000
exc_mask = 0000000000000000
iccsr = 0000000000000000
pal_base = 0000000000060000
hier = 00000000000018f0
hirr = 0000000000000000
mm_csr = 00000000000050e0
dc_stat = 0000000000000007
dc_addr = 00000007ffffffff
abox_ctl = 000000000000042e
biu_stat = 0000000000003440
biu_addr = 000000000212fe20
biu_ctl = 0000000e10006335
fill_syndrome = 0000000000000080
fill_addr = 000000000212fe20
va = 00000000001081e8
bc_tag = 0000000000408cd4
ident = 92
mcr_stat = ffffffff80808080
intr = 00000000
tc_status = 00000000
config = 00000003
panic (cpu 0): Machine check - Hardware error
syncing disks... DUMP.prom: dev SCSI 0 4 0 0 300 0 FLAMG-IO, block 131072
DUMP.prom: dev SCSI 0 4 0 0 300 0 FLAMG-IO, block 131072
"
}
_preserved_message_buffer_end:
_kernel_process_status_begin:
PID COMM
00000 kernel idle
00001 init
00003 kloadsrv
29827 kvt
[102 other processes]
_kernel_process_status_end:
_current_pid: 29827
_current_tid: 0xfffffc00075a4840
_proc_thread_list_begin:
thread 0xfffffc00075a4840 stopped at [boot:2466 ,0xfffffc00003dba08] Source not available
_proc_thread_list_end:
_dump_begin:
> 0 boot(0x400000000, 0x1, 0xfffffc0000280954, 0xfffffc00004d4160, 0xfffffc00004d4160) ["../../../../src/kernel/arch/alpha/machdep.c":2466, 0xfffffc00003dba08]
1 panic(s = 0xfffffc00004d6350 = "thread_block: interrupt level call") ["../../../../src/kernel/bsd/subr_prf.c":707, 0xfffffc000027f01c]
pcpu = 0xfffffc000052f8c0
i = 5071696
mycpu = 0
spl = 5
2 thread_block() ["../../../../src/kernel/kern/sched_prim.c":1925, 0xfffffc00002ac590]
thread = 0xfffffc00075a4840
new_thread = 0xfffffc00075a4840
mycpu = 0
myprocessor = 0xfffffc0000200100
s = 5
pset = 0x1000
3 thread_preempt(thread = 0x26, processor = 0xfffffc0000200100) ["../../../../src/kernel/kern/sched_prim.c":3820, 0xfffffc00002af124]
s = 2
pset = 0x1
4 boot(0x0, 0xfffffc00075a4840, 0x2c0000002c, 0x2d, 0x1) ["../../../../src/kernel/arch/alpha/machdep.c":2410, 0xfffffc00003db8f0]
5 panic(s = 0xfffffc00004f3d68 = "Machine check - Hardware error") ["../../../../src/kernel/bsd/subr_prf.c":791, 0xfffffc000027f1bc]
pcpu = 0xfffffc000052f8c0
i = 5301056
mycpu = 0
spl = 7
6 machcheck(0x0, 0xfffffc0000236f51, 0x1, 0xde42002, 0x4d) ["../../../../src/kernel/arch/alpha/hal/kn16aa.c":1393, 0xfffffc0000407ef0]
7 mach_error(0x1, 0xde42002, 0x4d, 0x3ff80008bdc, 0xfffffc00003d76a0) ["../../../../src/kernel/arch/alpha/hal/cpusw.c":808, 0xfffffc00003ec8e8]
8 _XentInt(0x8, 0x3ff80005bac, 0x3ffc000a7d0, 0x3ffbff47e21, 0x4d) ["../../../../src/kernel/arch/alpha/locore.s":1112, 0xfffffc00003d769c]
_dump_end:
[...]
_savedefp: (nil)
_kernel_memory_fault_data_begin:
struct {
fault_va = 0x0
fault_pc = 0x0
fault_ra = 0x0
fault_sp = 0x0
access = 0x0
status = 0x0
cpunum = 0x0
count = 0x0
pcb = (nil)
thread = (nil)
task = (nil)
proc = (nil)
}
_kernel_memory_fault_data_end:
_uptime: 264.88 hours
paniccpu: 0x0
machine_slot[paniccpu]: struct {
is_cpu = 0x1
cpu_type = 0xf
cpu_subtype = 0x7
running = 0x1
cpu_ticks = {
[0] 0x10916fa
[1] 0xc5e68
[2] 0x1cdb4f0
[3] 0x3745218f
[4] 0xbe21f
}
clock_freq = 0x400
error_restart = 0x0
cpu_panicstr = 0xfffffc00004f3d68 = "Machine check - Hardware error"
cpu_panic_thread = 0xfffffc00075a4840
}
tset machine_slot[paniccpu].cpu_panic_thread:
Begin Trace for machine_slot[paniccpu].cpu_panic_thread:
> 0 boot(0x400000000, 0x1, 0xfffffc0000280954, 0xfffffc00004d4160, 0xfffffc00004d4160) ["../../../../src/kernel/arch/alpha/machdep.c":2466, 0xfffffc00003dba08]
1 panic(s = 0xfffffc00004d6350 = "thread_block: interrupt level call") ["../../../../src/kernel/bsd/subr_prf.c":707, 0xfffffc000027f01c]
2 thread_block() ["../../../../src/kernel/kern/sched_prim.c":1925, 0xfffffc00002ac590]
3 thread_preempt(thread = 0x26, processor = 0xfffffc0000200100) ["../../../../src/kernel/kern/sched_prim.c":3820, 0xfffffc00002af124]
4 boot(0x0, 0xfffffc00075a4840, 0x2c0000002c, 0x2d, 0x1) ["../../../../src/kernel/arch/alpha/machdep.c":2410, 0xfffffc00003db8f0]
5 panic(s = 0xfffffc00004f3d68 = "Machine check - Hardware error") ["../../../../src/kernel/bsd/subr_prf.c":791, 0xfffffc000027f1bc]
6 machcheck(0x0, 0xfffffc0000236f51, 0x1, 0xde42002, 0x4d) ["../../../../src/kernel/arch/alpha/hal/kn16aa.c":1393, 0xfffffc0000407ef0]
7 mach_error(0x1, 0xde42002, 0x4d, 0x3ff80008bdc, 0xfffffc00003d76a0) ["../../../../src/kernel/arch/alpha/hal/cpusw.c":808, 0xfffffc00003ec8e8]
8 _XentInt(0x8, 0x3ff80005bac, 0x3ffc000a7d0, 0x3ffbff47e21, 0x4d) ["../../../../src/kernel/arch/alpha/locore.s":1112, 0xfffffc00003d769c]
End Trace for machine_slot[paniccpu].cpu_panic_thread:
"cpu_data" is not an array
_stack_trace[0]_begin:
> 0 boot(0x400000000, 0x1, 0xfffffc0000280954, 0xfffffc00004d4160, 0xfffffc00004d4160) ["../../../../src/kernel/arch/alpha/machdep.c":2466, 0xfffffc00003dba08]
1 panic(s = 0xfffffc00004d6350 = "thread_block: interrupt level call") ["../../../../src/kernel/bsd/subr_prf.c":707, 0xfffffc000027f01c]
2 thread_block() ["../../../../src/kernel/kern/sched_prim.c":1925, 0xfffffc00002ac590]
3 thread_preempt(thread = 0x26, processor = 0xfffffc0000200100) ["../../../../src/kernel/kern/sched_prim.c":3820, 0xfffffc00002af124]
4 boot(0x0, 0xfffffc00075a4840, 0x2c0000002c, 0x2d, 0x1) ["../../../../src/kernel/arch/alpha/machdep.c":2410, 0xfffffc00003db8f0]
5 panic(s = 0xfffffc00004f3d68 = "Machine check - Hardware error") ["../../../../src/kernel/bsd/subr_prf.c":791, 0xfffffc000027f1bc]
6 machcheck(0x0, 0xfffffc0000236f51, 0x1, 0xde42002, 0x4d) ["../../../../src/kernel/arch/alpha/hal/kn16aa.c":1393, 0xfffffc0000407ef0]
7 mach_error(0x1, 0xde42002, 0x4d, 0x3ff80008bdc, 0xfffffc00003d76a0) ["../../../../src/kernel/arch/alpha/hal/cpusw.c":808, 0xfffffc00003ec8e8]
8 _XentInt(0x8, 0x3ff80005bac, 0x3ffc000a7d0, 0x3ffbff47e21, 0x4d) ["../../../../src/kernel/arch/alpha/locore.s":1112, 0xfffffc00003d769c]
_stack_trace[0]_end:
_kdbx_proc_start:
Addr PID PPID PGRP UID NICE SIGCATCH P_SIG Event Flags
=========== ===== ===== ===== ===== ==== ======== ======== =========== ============
k0x09f6aca0 0 0 0 0 0 00000000 00000000 NULL in sys
k0x09f6b720 1 0 1 0 0 307a62ff 00000000 NULL in contign pagv
k0x09e54ca0 3 1 3 0 0 00004000 00000000 NULL in pagv
k0x05ea2ca0 29827 29802 17381 1731 0 00000000 00000000 NULL in pagv ctty
[...]
_kdbx_proc_end:
_crash_data_collection_finished:
#
# Output of uerf
#
******************************* ENTRY 75. *******************************
----- EVENT INFORMATION -----
EVENT CLASS ERROR EVENT
OS EVENT TYPE 100. CPU EXCEPTION
SEQUENCE NUMBER 1.
OPERATING SYSTEM DEC OSF/1
OCCURRED/LOGGED ON Fri Oct 16 09:40:16 1998
OCCURRED ON SYSTEM bleriot
SYSTEM ID x00020007 CPU TYPE: DEC 3000
SYSTYPE x00000000
----- UNIT INFORMATION -----
UNIT CLASS CPU
******************************* ENTRY 76. *******************************
----- EVENT INFORMATION -----
EVENT CLASS ERROR EVENT
OS EVENT TYPE 302. PANIC
SEQUENCE NUMBER 2.
OPERATING SYSTEM DEC OSF/1
OCCURRED/LOGGED ON Fri Oct 16 09:40:16 1998
OCCURRED ON SYSTEM bleriot
SYSTEM ID x00020007 CPU TYPE: DEC 3000
SYSTYPE x00000000
MESSAGE panic (cpu 0): Machine check -
_Hardware error
--
Christian Biache <biache_at_fr.airsysatm.thomson-csf.com>
AIRSYS ATM - 19, rue de la Fontaine - 92223 Bagneux CEDEX - France
Received on Fri Oct 16 1998 - 09:01:29 NZDT