Re: snapshot dump hangs

From: Randy Bush <randy_at_psg.com>
Date: Wed, 9 Jun 2004 07:10:04 -0700
> (1) Could you do a "ps awxl" and see what wait channel dump is blocked on?

ps -l | grep dump

  UID   PID  PPID CPU PRI NI   VSZ  RSS MWCHAN STAT  TT       TIME COMMAND
  ...
    0  1745  1701   0   8  0  1496 1220 wait   S+    p0    0:00.01 /sbin/rdump 0Luaf raid0.psg.com:/data/backup/psg.2004-06-09/var /dev/twed0s1d (rdump)
    0  1748  1745   0   4  0  1624 1268 sbwait S+    p0    0:02.55 rdump: /dev/twed0s1d: pass 4: 60.19% done, finished in 0:00 (rdump)
    0  1749  1748   0  20  0  1496 1220 pause  S+    p0    0:03.99 /sbin/rdump 0Luaf raid0.psg.com:/data/backup/psg.2004-06-09/var /dev/twed0s1d (rdump)
    0  1750  1748   0  20  0  1496 1220 pause  S+    p0    0:03.95 /sbin/rdump 0Luaf raid0.psg.com:/data/backup/psg.2004-06-09/var /dev/twed0s1d (rdump)
    0  1751  1748   0  20  0  1496 1220 pause  S+    p0    0:03.95 /sbin/rdump 0Luaf raid0.psg.com:/data/backup/psg.2004-06-09/var /dev/twed0s1d (rdump)
  ...

> (2) Could you break into DDB and generate a stack trace for dump?

db> trace 1745
sched_switch(c66cb150,8b088ded,52586aad,ffc00014,c66cb150) at sched_switch+0x145
mi_switch(1,c04d9400,c66ce6e0,c04d8e52,0) at mi_switch+0x1ab
sleepq_switch(c66ce6e0,0,e3bdcc40,c04b97e1,c66ce6e0) at sleepq_switch+0x16f
sleepq_wait_sig(c66ce6e0,5c,c66ce74c,c05fc4b5,0) at sleepq_wait_sig+0x14
msleep(c66ce6e0,c66ce74c,15c,c05fc4b5,0) at msleep+0x511
kern_wait(c66cb150,ffffffff,e3bdcc8c,0,e3bdcc90) at kern_wait+0xa19
wait4(c66cb150,e3bdcd14,10,7,4) at wait4+0x32
syscall(2f,2f,2f,6d1,bfbfe0c8) at syscall+0x320
Xint0x80_syscall() at Xint0x80_syscall+0x1d
--- syscall (7, FreeBSD ELF32, wait4), eip = 0x280c970f, esp = 0xbfbfe08c, ebp = 0xbfbfe0a8 ---
db> trace 1748
sched_switch(c61e97e0,ba59592b,b60532c8,ffc06014,c61e97e0) at sched_switch+0x145
mi_switch(1,c04d9400,e3997b74,c04a61ef,0) at mi_switch+0x1ab
sleepq_switch(c64466fc,0,e3997ba8,c04b97e1,c64466fc) at sleepq_switch+0x16f
sleepq_wait_sig(c64466fc,58,0,0,0) at sleepq_wait_sig+0x14
msleep(c64466fc,0,158,c05ff4a1,0) at msleep+0x511
sbwait(c64466dc,c613e900,c64fcd20,e3997bfc,4) at sbwait+0x4b
soreceive(c6446690,0,e3997c80,0,0) at soreceive+0x2a5
soo_read(c61ff990,e3997c80,c5fcde80,0,c61e97e0) at soo_read+0x93
dofileread(c61e97e0,c61ff990,7,bfbddb98,4) at dofileread+0xdc
read(c61e97e0,e3997d14,c,c61e97e0,3) at read+0x6b
syscall(807002f,805002f,bfbd002f,7,bfbddb98) at syscall+0x320
Xint0x80_syscall() at Xint0x80_syscall+0x1d
--- syscall (3, FreeBSD ELF32, read), eip = 0x280c978f, esp = 0xbfbddb5c, ebp = 0xbfbddb78 ---
db> t 1749
sched_switch(c6162d20,d3a7fbd3,25f26a7e,ffc03014,c6162d20) at sched_switch+0x145
mi_switch(1,0,0,0,0) at mi_switch+0x1ab
sleepq_switch(c66c4560,0,e393bc90,c04b97e1,c66c4560) at sleepq_switch+0x16f
sleepq_wait_sig(c66c4560,68,0,0,0) at sleepq_wait_sig+0x14
msleep(c66c4560,c66c4594,168,c05fc591,0) at msleep+0x511
kern_sigsuspend(c6162d20,0,0,0,0) at kern_sigsuspend+0xe4
sigsuspend(c6162d20,e393bd14,4,c6162d20,1) at sigsuspend+0x4f
syscall(2f,2f,2f,6d1,bfbfe020) at syscall+0x320
Xint0x80_syscall() at Xint0x80_syscall+0x1d
--- syscall (341, FreeBSD ELF32, sigsuspend), eip = 0x280c80cf, esp = 0xbfbfe00c, ebp = 0xbfbfe038 ---
db> t 1750
sched_switch(c6161e70,8dfce68b,1b1c2e63,ffc09014,c6161e70) at sched_switch+0x145
mi_switch(1,c04d9400,c6160df8,c04d8e52,0) at mi_switch+0x1ab
sleepq_switch(c6160df8,0,e391ac90,c04b97e1,c6160df8) at sleepq_switch+0x16f
sleepq_wait_sig(c6160df8,68,c6160e2c,c05fc591,0) at sleepq_wait_sig+0x14
msleep(c6160df8,c6160e2c,168,c05fc591,0) at msleep+0x511
kern_sigsuspend(c6161e70,0,0,0,0) at kern_sigsuspend+0xe4
sigsuspend(c6161e70,e391ad14,4,c6161e70,1) at sigsuspend+0x4f
syscall(2f,2f,2f,6d1,bfbfe020) at syscall+0x320
Xint0x80_syscall() at Xint0x80_syscall+0x1d
--- syscall (341, FreeBSD ELF32, sigsuspend), eip = 0x280c80cf, esp = 0xbfbfe00c, ebp = 0xbfbfe038 ---
db> t 1751
sched_switch(c64fcd20,3f635a47,1af03fb3,ffc09014,c64fcd20) at sched_switch+0x145
mi_switch(1,c04d9400,c66413a8,c04d8e52,0) at mi_switch+0x1ab
sleepq_switch(c66413a8,0,e3adcc90,c04b97e1,c66413a8) at sleepq_switch+0x16f
sleepq_wait_sig(c66413a8,68,c66413dc,c05fc591,0) at sleepq_wait_sig+0x14
msleep(c66413a8,c66413dc,168,c05fc591,0) at msleep+0x511
kern_sigsuspend(c64fcd20,0,0,0,0) at kern_sigsuspend+0xe4
sigsuspend(c64fcd20,e3adcd14,4,c64fcd20,1) at sigsuspend+0x4f
syscall(2f,2f,2f,6d1,bfbfe020) at syscall+0x320
Xint0x80_syscall() at Xint0x80_syscall+0x1d
--- syscall (341, FreeBSD ELF32, sigsuspend), eip = 0x280c80cf, esp = 0xbfbfe00c, ebp = 0xbfbfe038 ---

> (3) Could you run "show lockedvnods" in DDB and show the results?

db> show lockedvnods
Locked vnodes

> (4) Could you run "show locks <pid>" on the dump process?

db> show locks 1745
No such command

randy
Received on Wed Jun 09 2004 - 12:10:07 UTC

This archive was generated by hypermail 2.4.0 : Wed May 19 2021 - 11:37:56 UTC