Skip site navigation (1)Skip section navigation (2)
Date:      Sun, 30 May 2004 15:52:04 -0400
From:      Don Bowman <don@sandvine.com>
To:        "'current@freebsd.org'" <current@freebsd.org>
Subject:   hang with raid, postgresql
Message-ID:  <FE045D4D9F7AED4CBFF1B3B813C85337051D8DE4@mail.sandvine.com>

next in thread | raw e-mail | index | archive | help
This message is in MIME format. Since your mail reader does not understand
this format, some or all of this message may not be legible.

------_=_NextPart_000_01C4467F.951AA9C0
Content-Type: text/plain;
	charset="iso-8859-1"


I have a system with 2x 2.8GHz XEON (P4), intel e7501 chipset, 
4GB of ram, aac [adaptec 2200s] raid with 4 scsi
disks. I have also tried asr (adaptec 2015).
I have tried two different motherboards.
The only application the machine runs is postgresql,
with ~30 databases and ~250GB of data.

I'm finding the machine locks up solid once a day
or so (sometimes more, sometimes less, no pattern
of time of day). I know it's not a hardware issue: it
is reliable with FreeBSD 4.7. I've run through memory
test, disk test, etc.

There appears to be a correlation between
disk activity (postgresql vacuum) and the lockup,
but I can't be sure.

I've just reproduced it with a cvsup from head today
[2004-05-30 12:00 EDT], so it's still present.
I've got a serial console, and the break to 
debugger (which works under normal circumstances).

In the lockup case, I cannot drop into db, and
no output appears anywhere. I have enabled
the following options, but still no effect, no
messages come out (other than erroneous LOR
issues).

options         ALT_BREAK_TO_DEBUGGER
options         DDB            
options         INVARIANTS     
options         INVARIANT_SUPPORT 
options         WITNESS
options         WITNESS_SKIPSPIN
options         MUTEX_DEBUG
options         DIAGNOSTIC

I've tried both with and without ACPI. It
does not have PAE configured in.

The fact that I can't drop into the debugger
using the CR ~ ^B sequence when it's locked up
implies that it's no longer servicing the serial
interrupt.

Does anyone have any suggestions? postgresql
makes use of disk, sysv semaphores, shared memory,
etc.

I don't have sound, vga, X, ... any of the
'complicated' things, it's just a server.
There is no ATA.

I tried setting kern.smp.active to 0, but
it still locked up.

I'm looking for any suggestions. I have 
attached the config file from it if anyone
has any comments on that.

--don



------_=_NextPart_000_01C4467F.951AA9C0
Content-Type: application/octet-stream;
	name="CDATA"
Content-Transfer-Encoding: quoted-printable
Content-Disposition: attachment;
	filename="CDATA"

machine		i386=0A=
cpu		I686_CPU=0A=
ident		CDATA=0A=
=0A=
makeoptions	DEBUG=3D-g		#Build kernel with gdb(1) debug symbols=0A=
=0A=
options 	SCHED_4BSD		#4BSD scheduler=0A=
options 	INET			#InterNETworking=0A=
options 	INET6			#IPv6 communications protocols=0A=
options 	FFS			#Berkeley Fast Filesystem=0A=
options 	SOFTUPDATES		#Enable FFS soft updates support=0A=
options 	UFS_ACL			#Support for access control lists=0A=
options 	UFS_DIRHASH		#Improve performance on big directories=0A=
options 	MD_ROOT			#MD is a potential root device=0A=
options 	NFSCLIENT		#Network Filesystem Client=0A=
options 	NFSSERVER		#Network Filesystem Server=0A=
options 	NFS_ROOT		#NFS usable as /, requires NFSCLIENT=0A=
options 	MSDOSFS			#MSDOS Filesystem=0A=
options 	CD9660			#ISO 9660 Filesystem=0A=
options 	PROCFS			#Process filesystem (requires PSEUDOFS)=0A=
options 	PSEUDOFS		#Pseudo-filesystem framework=0A=
options 	COMPAT_43		#Compatible with BSD 4.3 [KEEP THIS!]=0A=
options 	COMPAT_FREEBSD4		#Compatible with FreeBSD4=0A=
options 	SCSI_DELAY=3D1000		#Delay (in ms) before probing SCSI=0A=
options 	KTRACE			#ktrace(1) support=0A=
options 	SYSVSHM			#SYSV-style shared memory=0A=
options 	SYSVMSG			#SYSV-style message queues=0A=
options 	SYSVSEM			#SYSV-style semaphores=0A=
options 	_KPOSIX_PRIORITY_SCHEDULING #Posix P1003_1B real-time =
extensions=0A=
options 	KBD_INSTALL_CDEV	# install a CDEV entry in /dev=0A=
options 	AHC_REG_PRETTY_PRINT	# Print register bitfields in debug=0A=
					# output.  Adds ~128k to driver.=0A=
options 	AHD_REG_PRETTY_PRINT	# Print register bitfields in debug=0A=
					# output.  Adds ~215k to driver.=0A=
options 	PFIL_HOOKS		# pfil(9) framework=0A=
=0A=
# Debugging for use in -current=0A=
options 	DDB			#Enable the kernel debugger=0A=
options 	INVARIANTS		#Enable calls of extra sanity checking=0A=
options 	INVARIANT_SUPPORT	#Extra sanity checks of internal structures, =
required by INVARIANTS=0A=
options 	WITNESS			#Enable checks to detect deadlocks and cycles=0A=
options 	WITNESS_SKIPSPIN	#Don't run witness on spinlocks for speed=0A=
options         MUTEX_DEBUG=0A=
options         DIAGNOSTIC=0A=
=0A=
=0A=
=0A=
# To make an SMP kernel, the next two are needed=0A=
options 	SMP			# Symmetric MultiProcessor Kernel=0A=
device		apic			# I/O APIC=0A=
=0A=
device		isa=0A=
device		eisa=0A=
device		pci=0A=
=0A=
# Floppy drives=0A=
device		fdc=0A=
=0A=
# ATA and ATAPI devices=0A=
device		ata=0A=
device		atadisk			# ATA disk drives=0A=
device		ataraid			# ATA RAID drives=0A=
device		atapicd			# ATAPI CDROM drives=0A=
device		atapifd			# ATAPI floppy drives=0A=
device		atapist			# ATAPI tape drives=0A=
options 	ATA_STATIC_ID		#Static device numbering=0A=
=0A=
# SCSI Controllers=0A=
device		ahd		# AHA39320/29320 and onboard AIC79xx devices=0A=
# SCSI peripherals=0A=
device		scbus		# SCSI bus (required for SCSI)=0A=
device		ch		# SCSI media changers=0A=
device		da		# Direct Access (disks)=0A=
device		sa		# Sequential Access (tape etc)=0A=
device		cd		# CD=0A=
device		pass		# Passthrough device (direct SCSI access)=0A=
device		ses		# SCSI Environmental Services (and SAF-TE)=0A=
=0A=
# RAID controllers interfaced to the SCSI subsystem=0A=
device		asr		# DPT SmartRAID V, VI and Adaptec SCSI RAID=0A=
device		ciss		# Compaq Smart RAID 5*=0A=
device		dpt		# DPT Smartcache III, IV - See NOTES for options=0A=
device		iir		# Intel Integrated RAID=0A=
device		ips		# IBM (Adaptec) ServeRAID=0A=
device		mly		# Mylex AcceleRAID/eXtremeRAID=0A=
device		aac		# Adaptec FSA RAID=0A=
device		amr		# AMI MegaRAID=0A=
device		aacp		# SCSI passthrough for aac (requires CAM)=0A=
device		ida		# Compaq Smart RAID=0A=
device		mlx		# Mylex DAC960 family=0A=
device		pst		# Promise Supertrak SX6000=0A=
device		twe		# 3ware ATA RAID=0A=
=0A=
# atkbdc0 controls both the keyboard and the PS/2 mouse=0A=
device		atkbdc		# AT keyboard controller=0A=
device		atkbd		# AT keyboard=0A=
device		psm		# PS/2 mouse=0A=
=0A=
device		vga		# VGA video card driver=0A=
=0A=
device		splash		# Splash screen and screen saver support=0A=
=0A=
# syscons is the default console driver, resembling an SCO console=0A=
device		sc=0A=
=0A=
# Enable this for the pcvt (VT220 compatible) console driver=0A=
#device		vt=0A=
#options 	XSERVER			# support for X server on a vt console=0A=
#options 	FAT_CURSOR		# start with block cursor=0A=
=0A=
device		agp		# support several AGP chipsets=0A=
=0A=
# Floating point support - do not disable.=0A=
device		npx=0A=
=0A=
# Power management support (see NOTES for more options)=0A=
#device		apm=0A=
# Add suspend/resume support for the i8254.=0A=
device		pmtimer=0A=
=0A=
# PCCARD (PCMCIA) support=0A=
# Pcmcia and cardbus bridge support=0A=
device		cbb			# cardbus (yenta) bridge=0A=
#device		pcic			# ExCA ISA and PCI bridges=0A=
device		pccard			# PC Card (16-bit) bus=0A=
device		cardbus			# CardBus (32-bit) bus=0A=
=0A=
# Serial (COM) ports=0A=
device		sio		# 8250, 16[45]50 based serial ports=0A=
=0A=
# PCI Ethernet NICs.=0A=
device		em		# Intel PRO/1000 adapter Gigabit Ethernet Card=0A=
=0A=
# PCI Ethernet NICs that use the common MII bus controller code.=0A=
# NOTE: Be sure to keep the 'device miibus' line in order to use these =
NICs!=0A=
device		miibus		# MII bus support=0A=
device		bfe		# Broadcom BCM440x 10/100 ethernet=0A=
device		bge		# Broadcom BCM570xx Gigabit Ethernet=0A=
device		fxp		# Intel EtherExpress PRO/100B (82557, 82558)=0A=
device		xl		# 3Com 3c90x (``Boomerang'', ``Cyclone'')=0A=
=0A=
# Pseudo devices - the number indicates how many units to allocate.=0A=
device		random		# Entropy device=0A=
device		loop		# Network loopback=0A=
device		ether		# Ethernet support=0A=
device		tun		# Packet tunnel.=0A=
device		pty		# Pseudo-ttys (telnet etc)=0A=
device		md		# Memory "disks"=0A=
device		gif		# IPv6 and IPv4 tunneling=0A=
device		faith		# IPv6-to-IPv4 relaying (translation)=0A=
=0A=
# The `bpf' device enables the Berkeley Packet Filter.=0A=
# Be aware of the administrative consequences of enabling this!=0A=
device		bpf		# Berkeley packet filter=0A=
=0A=
# USB support=0A=
device		uhci		# UHCI PCI->USB interface=0A=
device		ohci		# OHCI PCI->USB interface=0A=
device		usb		# USB Bus (required)=0A=
#device		udbp		# USB Double Bulk Pipe devices=0A=
device		ugen		# Generic=0A=
device		uhid		# "Human Interface Devices"=0A=
device		ukbd		# Keyboard=0A=
device		ulpt		# Printer=0A=
device		umass		# Disks/Mass storage - Requires scbus and da=0A=
device		ums		# Mouse=0A=
device		urio		# Diamond Rio 500 MP3 player=0A=
device		uscanner	# Scanners=0A=
# USB Ethernet, requires mii=0A=
device		aue		# ADMtek USB ethernet=0A=
device		axe		# ASIX Electronics USB ethernet=0A=
device		cue		# CATC USB ethernet=0A=
device		kue		# Kawasaki LSI USB ethernet=0A=
=0A=
options 	ALT_BREAK_TO_DEBUGGER=0A=
options 	DDB_UNATTENDED=0A=
=0A=
options 	MAXDSIZ=3D(1536UL*1024*1024)=0A=
options 	MAXSSIZ=3D(128UL*1024*1024)=0A=
options 	DFLDSIZ=3D(1024UL*1024*1024)=0A=
options 	INCLUDE_CONFIG_FILE     # Include this file in kernel=0A=
device		gre			#IP over IP tunneling=0A=
options 	IPFIREWALL		#firewall=0A=
options 	IPFIREWALL_DEFAULT_TO_ACCEPT	#allow everything by default=0A=
options 	HZ=3D1000=0A=
options 	SES_ENABLE_PASSTHROUGH=0A=
device		smbus		# Bus support, required for smb below.=0A=
device		smb=0A=
device		ichsmb=0A=
options 	SEMMNS=3D256=0A=
options 	SEMMNI=3D128=0A=
options 	SEMMSL=3D128=0A=
=0A=
options         CONSPEED=3D115200 =0A=
#option	       VM_KMEM_SIZE_SCALE=3D2=0A=
options         VM_KMEM_SIZE_MAX=3D419430400=0A=
options         CPU_ENABLE_SSE=0A=
=0A=
options	CPU_ENABLE_TCC=0A=

------_=_NextPart_000_01C4467F.951AA9C0--



Want to link to this message? Use this URL: <https://mail-archive.FreeBSD.org/cgi/mid.cgi?FE045D4D9F7AED4CBFF1B3B813C85337051D8DE4>