I just got an SMP lockup running qa 013 with yesterday's t-o-t.
Unfortunately I haven't been able to reproduce it. I'm pretty sure
the stress being run was:
fsstress -v -p 5 -r -n 1000
Here's the kdb info:
[1]kdb> cpu 0
Entering kdb (0xf4fe6000) on processor 0 due to cpu switch
[0]kdb> bt
EBP EIP Function(args)
0xc01f797a stext_lock+0x1a32
kernel .text.lock 0xc01f5f48 0xc01f5f48
0xc01fbca0
0xf4fe7dac 0xc0132c1e insert_into_queues+0x5e (0xf750c180, 0xf750c180,
0xc013314c, 0x0)
kernel .text 0xc0100000 0xc0132bc0 0xc0132c80
0xf4fe7dd8 0xc013335c getblk+0xa0 (0x100, 0xccf, 0x400)
kernel .text 0xc0100000 0xc01332bc 0xc013338c
0xf4fe7df8 0xc016da3d rd_request+0xad (0xc033c128)
kernel .text 0xc0100000 0xc016d990 0xc016dac0
0xf4fe7e08 0xc0164ab7 generic_unplug_device+0x2f (0xc033c128)
kernel .text 0xc0100000 0xc0164a88 0xc0164ac8
0xf4fe7e18 0xf89049a2 [xfs]xfs_trigger_io+0x5a
xfs .text 0xf888e060 0xf8904948 0xf89049b0
0xf4fe7e4c 0xf88d9086 [xfs]xlog_sync+0x2c6 (0xf5eaf8e0, 0xf5390000, 0x0)
xfs .text 0xf888e060 0xf88d8dc0 0xf88d92dc
0xf4fe7e80 0xf88da9e9 [xfs]xlog_state_release_iclog+0x121 (0xf5eaf8e0,
0xf5390000)
xfs .text 0xf888e060 0xf88da8c8 0xf88da9f4
0xf4fe7eac 0xf88dabd5 [xfs]xlog_state_sync_all+0xf5 (0xf5eaf8e0, 0x2)
xfs .text 0xf888e060 0xf88daae0 0xf88dac9c
0xf4fe7ec8 0xf88d7ca7 [xfs]xfs_log_force+0x77 (0xf4699000, 0x0, 0x0, 0x2)
xfs .text 0xf888e060 0xf88d7c30 0xf88d7cd4
0xf4fe7f50 0xf88f122f [xfs]xfs_syncsub+0xeb (0xf4699000, 0x31, 0x0, 0x0,
0xf4699000)
xfs .text 0xf888e060 0xf88f1144 0xf88f2404
0xf4fe7f70 0xf88f113b [xfs]xfs_sync+0x1b (0xf4699000, 0x31, 0xf8920f80)
xfs .text 0xf888e060 0xf88f1120 0xf88f1144
0xf4fe7f88 0xf8906304 [xfs]linvfs_write_super+0x24 (0xf53bde00)
xfs .text 0xf888e060 0xf89062e0 0xf8906310
0xf4fe7f9c 0xc0136578 sync_supers+0x6c (0x0)
kernel .text 0xc0100000 0xc013650c 0xc01365a0
0xf4fe7fb0 0xc0132844 fsync_dev+0x3c (0x0)
kernel .text 0xc0100000 0xc0132808 0xc013289c
0xf4fe7fbc 0xc01328a6 sys_sync+0xa (0x804ec68, 0xdd4176f0, 0x22be890f,
0x4000ae60, 0xbffff984)
kernel .text 0xc0100000 0xc013289c 0xc01328ac
0xc0109040 system_call+0x34
kernel .text 0xc0100000 0xc010900c 0xc0109044
[0]kdb>
[0]kdb> cpu 1
Entering kdb (0xf42ca000) on processor 1 due to cpu switch
[1]kdb> bt
EBP EIP Function(args)
0xc01fa1ea stext_lock+0x42a2
kernel .text.lock 0xc01f5f48 0xc01f5f48
0xc01fbca0
0xf42cbef4 0xc01aa38e sym53c8xx_intr+0x62 (0x39, 0xf7cd6000, 0xf42cbf44,
0x720, 0xc0317f20)
kernel .text 0xc0100000 0xc01aa32c 0xc01aa3cc
0xf42cbf14 0xc010ab39 handle_IRQ_event+0x4d (0x39, 0xf42cbf44, 0xf7f80b00,
0x632, 0xefd60ae0)
kernel .text 0xc0100000 0xc010aaec 0xc010ab68
0xf42cbf3c 0xc010ad39 do_IRQ+0x99
kernel .text 0xc0100000 0xc010aca0 0xc010ad8c
0xc0109100 ret_from_intr
kernel .text 0xc0100000 0xc0109100 0xc0109120
Interrupt registers:
eax = 0xefd60a80 ebx = 0x00000632 ecx = 0xefdf26c0 edx = 0xefdf26c0
esi = 0xefd60ae0 edi = 0x00000000 esp = 0xf42cbf78 eip = 0xc0132653
ebp = 0xf42cbf98 ss = 0x00000018 cs = 0x00000010 eflags = 0x00000246
ds = 0xf6a60018 es = 0xf6a60018 origeax = 0xffffff39 &regs = 0xf42cbf44
0xc0132653 sync_buffers+0x83 (0x0, 0x0)
kernel .text 0xc0100000 0xc01325d0 0xc01327dc
0xf42cbfb0 0xc0132819 fsync_dev+0x11 (0x0)
kernel .text 0xc0100000 0xc0132808 0xc013289c
0xf42cbfbc 0xc01328a6 sys_sync+0xa (0x804ec68, 0xdd4176f0, 0x22be890f,
0x4000ae60, 0xbffff984)
kernel .text 0xc0100000 0xc013289c 0xc01328ac
0xc0109040 system_call+0x34
[1]more>
kernel .text 0xc0100000 0xc010900c 0xc0109044
[1]kdb>
[1]kdb> ps
Task Addr Pid Parent [*] cpu State Thread Command
0xf7fb2000 00000001 00000000 0 001 stop 0xf7fb2340 init
0xf7f8c000 00000002 00000001 0 001 stop 0xf7f8c340 kswapd
0xf7f8a000 00000003 00000001 0 001 stop 0xf7f8a340 kflushd
0xf7f88000 00000004 00000001 0 001 stop 0xf7f88340 kupdate
0xf5c60000 00000350 00000001 0 000 stop 0xf5c60340 portmap
0xf6702000 00000429 00000001 0 000 stop 0xf6702340 rpciod
0xf645a000 00000430 00000001 0 000 stop 0xf645a340 lockd
0xf56fa000 00000453 00000001 0 000 stop 0xf56fa340 syslogd
0xf6806000 00000465 00000001 0 000 run 0xf6806340 klogd
0xf68c0000 00000482 00000001 0 001 stop 0xf68c0340 identd
0xf5c0e000 00000484 00000482 0 001 stop 0xf5c0e340 identd
0xf6646000 00000485 00000484 0 001 stop 0xf6646340 identd
0xf5a60000 00000486 00000484 0 001 stop 0xf5a60340 identd
0xf5e94000 00000487 00000484 0 001 stop 0xf5e94340 identd
0xf5dd6000 00000503 00000001 0 001 stop 0xf5dd6340 atd
0xf57c6000 00000520 00000001 0 000 stop 0xf57c6340 crond
0xf65f4000 00000537 00000001 0 000 stop 0xf65f4340 inetd
0xf5a56000 00000648 00000001 0 000 stop 0xf5a56340 pmcd
0xf5ea0000 00000801 00000001 0 000 stop 0xf5ea0340 pmlogger
0xf5ad2000 00000851 00000001 0 000 stop 0xf5ad2340 minilogd
0xf6986000 00000867 00000001 0 000 stop 0xf6986340 mingetty
0xf609e000 00000868 00000001 0 000 stop 0xf609e340 mingetty
[1]more>
0xf5952000 00000869 00000001 0 000 stop 0xf5952340 mingetty
0xf574e000 00000870 00000001 0 001 stop 0xf574e340 mingetty
0xf56ca000 00000871 00000001 0 001 stop 0xf56ca340 mingetty
0xf69fc000 00000872 00000001 0 001 stop 0xf69fc340 mingetty
0xf64f8000 00000873 00000001 0 000 stop 0xf64f8340 login
0xf5eb2000 00000898 00000873 0 001 stop 0xf5eb2340 tcsh
0xf556e000 00001497 00000001 0 000 stop 0xf556e340 pagebuf_daemon
0xf55ba000 00001498 00000001 0 000 stop 0xf55ba340 page_daemon
0xf32fa000 00007853 00000898 0 000 stop 0xf32fa340 check
0xf361c000 00008084 00007853 0 000 stop 0xf361c340 sh
0xf2e70000 00008138 00008084 0 000 stop 0xf2e70340 fsstress
0xf42ca000 00008139 00008138 1 001 run 0xf42ca340*fsstress
0xf1e78000 00008140 00008138 0 001 stop 0xf1e78340 fsstress
0xe4092000 00008141 00008138 0 000 stop 0xe4092340 fsstress
0xf4044000 00008142 00008138 0 001 run 0xf4044340 fsstress
0xf4fe6000 00008143 00008138 1 000 run 0xf4fe6340 fsstress
[1]kdb> btp 8139
EBP EIP Function(args)
0xc01fa1ea stext_lock+0x42a2
kernel .text.lock 0xc01f5f48 0xc01f5f48
0xc01fbca0
0xf7f80b00 0xc01aa38e sym53c8xx_intr+0x62 (0x39, 0xf7cd6000, 0xf42cbf44,
0x720, 0xc0317f20)
kernel .text 0xc0100000 0xc01aa32c 0xc01aa3cc
0xf42cbf14 0xc010ab39 handle_IRQ_event+0x4d (0x39, 0xf42cbf44, 0xf7f80b00,
0x632, 0xefd60ae0)
kernel .text 0xc0100000 0xc010aaec 0xc010ab68
0xf42cbf3c 0xc010ad39 do_IRQ+0x99
kernel .text 0xc0100000 0xc010aca0 0xc010ad8c
0xc0109100 ret_from_intr
kernel .text 0xc0100000 0xc0109100 0xc0109120
Interrupt registers:
eax = 0xefd60a80 ebx = 0x00000632 ecx = 0xefdf26c0 edx = 0xefdf26c0
esi = 0xefd60ae0 edi = 0x00000000 esp = 0xf42cbf78 eip = 0xc0132653
ebp = 0xf42cbf98 ss = 0x00000018 cs = 0x00000010 eflags = 0x00000246
ds = 0xf6a60018 es = 0xf6a60018 origeax = 0xffffff39 &regs = 0xf42cbf44
0xc0132653 sync_buffers+0x83 (0x0, 0x0)
kernel .text 0xc0100000 0xc01325d0 0xc01327dc
0xf42cbfb0 0xc0132819 fsync_dev+0x11 (0x0)
kernel .text 0xc0100000 0xc0132808 0xc013289c
0xf42cbfbc 0xc01328a6 sys_sync+0xa (0x804ec68, 0xdd4176f0, 0x22be890f,
0x4000ae60, 0xbffff984)
kernel .text 0xc0100000 0xc013289c 0xc01328ac
0xc0109040 system_call+0x34
kernel .text 0xc0100000 0xc010900c 0xc0109044
-----------------------------------------------------
Daniel Moore dxm@xxxxxxx
R&D Software Engineer Phone: +61-3-98348209
SGI Performance Tools Group Fax: +61-3-98132378
-----------------------------------------------------
|