Date: Thu, 20 Dec 2001 13:32:19 -0500 From: "Robin P. Blanchard" <Robin_Blanchard@gactr.uga.edu> To: stable@freebsd.org Subject: SMP kernel faulting. Message-ID: <3C222EB3.EE03334@gactr.uga.edu> References: <Pine.BSF.4.32.0112200759400.70923-100000@localhost>
next in thread | previous in thread | raw e-mail | index | archive | help
> *except from rc.conf:
> *dumpdev="/dev/amrd0s1b"
> *dumpdir="/usr/local/var/adm/crash"
> The dumpdev looks like you're dumping to your swap disk?
> The dumpdir looks wrong. Shouldn't it be to /var/adm/crash?
> My $.02. -George
as it turns out:
'dumpdev="/dev/amrd0s1b"' is invalid due to the AMI megaraid not
supporting (?!?) dumping. I grabbed an old external scsi disk and set it
up as another swap and was able to get the dump (see below). The box in
question here is a Dell 4350, dual p3-600, with 3/4gig RAM. The same
kernel as uni-processor runs great (all based on a CVS grab of -STABLE
from two days ago).
This being my first attempt at debugging a kernel, please let me know if
there is more useful information required. I'd like to get this box
running SMP again (it was an NT 4 app server for the last two years
without problems). Kernel config follows the debug info.
(kgdb) symbol-file kernel.debug
Reading symbols from kernel.debug...done.
(kgdb) exec-file /usr/local/var/adm/crash/kernel.0
(kgdb) core-file /usr/local/var/adm/crash/vmcore.0
SMP 2 cpus
IdlePTD at phsyical address 0x0035a000
initial pcb at physical address 0x002c7d20
panicstr: from debugger
panic messages:
---
Fatal trap 12: page fault while in kernel mode
mp_lock = 01000002; cpuid = 1; lapic.id = 00000000
fault virtual address = 0x9fdfe8c7
fault code = supervisor write, page not present
instruction pointer = 0x8:0xc01e3be8
stack pointer = 0x10:0xff80fef0
frame pointer = 0x10:0xc01e3b00
code segment = base 0x0, limit 0xfffff, type 0x1b
= DPL 0, pres 1, def32 1, gran 1
processor eflags = interrupt enabled, resume, IOPL = 0
current process = Idle
interrupt mask = net <- SMP: XXX
panic: from debugger
mp_lock = 01000002; cpuid = 1; lapic.id = 00000000
panic: from debugger
mp_lock = 01000003; cpuid = 1; lapic.id = 00000000
boot() called on cpu#1
Uptime: 1h33m31s
amr0: flushing cache...done
dumping to dev #da/0x20001, offset 3932851
dump 128 127 126 125 124 123 122 121 120 119 118 117 116 115 114 113 112
111 110 109 108 107 106 105 104 103 102 101 100 99 98 97 96 95 94 93 92
91 90 89 88 87 86 85 84 83 82 81 80 79 78 77 76 75 74 73 72 71 70 69 68
67 66 65 64 63 62 61 60 59 58 57 56 55 54 53 52 51 50 49 48 47 46 45 44
43 42 41 40 39 38 37 36 35 34 33 32 31 30 29 28 27 26 25 24 23 22 21 20
19 18 17 16 15 14 13 12 11 10 9 8 7 6 5 4 3 2 1
---
#0 dumpsys () at ../../kern/kern_shutdown.c:473
473 if (dumping++) {
(kgdb) where
#0 dumpsys () at ../../kern/kern_shutdown.c:473
#1 0xc016e49c in boot (howto=260) at ../../kern/kern_shutdown.c:313
#2 0xc016e8cd in panic (fmt=0xc026f8c4 "from debugger")
at ../../kern/kern_shutdown.c:581
#3 0xc01379f1 in db_panic (addr=-1071760408, have_addr=0, count=-1,
modif=0xff80fd54 "") at ../../ddb/db_command.c:435
#4 0xc013798f in db_command (last_cmdp=0xc02a5b04,
cmd_table=0xc02a5944,
aux_cmd_tablep=0xc02c2bf8) at ../../ddb/db_command.c:333
#5 0xc0137a56 in db_command_loop () at ../../ddb/db_command.c:457
#6 0xc0139c07 in db_trap (type=12, code=0) at ../../ddb/db_trap.c:71
#7 0xc0242750 in kdb_trap (type=12, code=0, regs=0xff80feb0)
at ../../i386/i386/db_interface.c:158
#8 0xc0256c36 in trap_fatal (frame=0xff80feb0, eva=2682251463)
at ../../i386/i386/trap.c:951
#9 0xc02568b5 in trap_pfault (frame=0xff80feb0, usermode=0,
eva=2682251463)
at ../../i386/i386/trap.c:849
#10 0xc02563fb in trap (frame={tf_fs = 24, tf_es = -8388592,
tf_ds = -1071316976, tf_edi = 1644167168, tf_esi = -1065689856,
tf_ebp = -1071760640, tf_isp = -8323364, tf_ebx = -1065689856,
tf_edx = 1711277060, tf_ecx = -744332028, tf_eax = -8323320,
tf_trapno = 12, tf_err = 2, tf_eip = -1071760408, tf_cs = 8,
tf_eflags = 66118, tf_esp = -1072124367, tf_ss = -744332064})
at ../../i386/i386/trap.c:448
---Type <return> to continue, or q <return> to quit---
#11 0xc01e3be8 in nfs_readdirrpc (vp=0xfc458908, uiop=0x8bfc758b,
cred=0x4083f845) at ../../nfs/nfs_vnops.c:2121
#12 0x408bf845 in ?? ()
cannot read proc at 0
kernel config:
options INCLUDE_CONFIG_FILE
machine i386
cpu I686_CPU
options SMP
options APIC_IO
options CPU_ENABLE_SSE
options USER_LDT
ident DUAL-4350
maxusers 32
makeoptions DEBUG=-g #Build kernel with gdb(1) debug symbols
options DDB
#options DDB_UNATTENDED
options KTRACE #kernel tracing
options INVARIANTS
options INVARIANT_SUPPORT
options DIAGNOSTIC
options MAXMEM="(128*1024)"
options INET #InterNETworking
options FFS #Berkeley Fast Filesystem
options FFS_ROOT #FFS usable as root device [keep this!]
options SOFTUPDATES #Enable FFS soft updates support
options UFS_DIRHASH
#options MFS #this was an SMP culprit before?
options NFS #Network Filesystem
options NFS_NOSERVER
options MSDOSFS #MSDOS Filesystem
options CD9660 #ISO 9660 Filesystem
options PROCFS #Process filesystem
options COMPAT_43 #Compatible with BSD 4.3 [KEEP THIS!]
options SCSI_DELAY=5000 #Delay (in ms) before probing SCSI
options KTRACE #ktrace(1) support
options SYSVSHM #SYSV-style shared memory
options SYSVMSG #SYSV-style message queues
options SYSVSEM #SYSV-style semaphores
options SHMMAXPGS=8192
options SHMMNI=4096
options SHMSEG=1024
options P1003_1B #Posix P1003_1B real-time extensions
options _KPOSIX_PRIORITY_SCHEDULING
options KBD_INSTALL_CDEV # install a CDEV entry in /dev
options ICMP_BANDLIM
options TCP_DROP_SYNFIN
options COMPAT_LINUX
options DEBUG_LINUX
options RANDOM_IP_ID
device isa
device pci
device amr
device ahc
device scbus
device da
device sa
device cd
device pass
device ses
device pt
# Floppy drives
device fdc0 at isa? port IO_FD1 irq 6 drq 2
device fd0 at fdc0 drive 0
# ATA and ATAPI devices
device ata0 at isa? port IO_WD1 irq 14
device ata1 at isa? port IO_WD2 irq 15
device ata
device atadisk # ATA disk drives
device atapicd # ATAPI CDROM drives
device atapifd # ATAPI floppy drives
device atapist # ATAPI tape drives
options ATA_STATIC_ID #Static device numbering
# atkbdc0 controls both the keyboard and the PS/2 mouse
device atkbdc0 at isa? port IO_KBD
device atkbd0 at atkbdc? irq 1 flags 0x1
device vga0 at isa?
options VESA
options VGA_WIDTH90
# splash screen/screen saver
pseudo-device splash
# syscons is the default console driver, resembling an SCO console
device sc0 at isa? flags 0x100
# Floating point support - do not disable.
device npx0 at nexus? port IO_NPX irq 13
# Serial (COM) ports
device sio0 at isa? port IO_COM1 flags 0x10 irq 4
options CONSPEED=115200
# PCI Ethernet NICs.
device miibus # MII bus support
device fxp # Intel EtherExpress PRO/100B (82557, 82558)
device sk
options NMBCLUSTERS=65535
# Pseudo devices - the number indicates how many units to allocate.
pseudo-device loop # Network loopback
pseudo-device ether # Ethernet support
pseudo-device tun # Packet tunnel.
pseudo-device pty # Pseudo-ttys (telnet etc)
pseudo-device md # Memory "disks"
pseudo-device gif 4 # IPv6 and IPv4 tunneling
pseudo-device gzip
pseudo-device vn
pseudo-device bpf
--
------------------------------------
Robin P. Blanchard
IT Program Specialist
Georgia Center for Continuing Ed.
fon: 706.542.2404 fax: 706.542.6546
email: Robin_Blanchard@gactr.uga.edu
------------------------------------
To Unsubscribe: send mail to majordomo@FreeBSD.org
with "unsubscribe freebsd-stable" in the body of the message
Want to link to this message? Use this URL: <https://mail-archive.FreeBSD.org/cgi/mid.cgi?3C222EB3.EE03334>
