Bacula-users

Re: [Bacula-users] Storage daemons dies on restore

2008-07-22 04:12:31
Subject: Re: [Bacula-users] Storage daemons dies on restore
From: Andrea Venturoli <ml AT netfence DOT it>
To: Martin Simmons <martin AT lispworks DOT com>
Date: Tue, 22 Jul 2008 10:10:33 +0200
Martin Simmons wrote:

> The best thing is to attach gdb to the running SD soon after it starts and 
>  then use the commands 
>  
>  bt 
>  info all 
>  thread apply all bt 
>  
>  to generate a report when it crashes. 

Here it is:

Program received signal SIGSEGV, Segmentation fault.
[Switching to Thread 0x5de400 (LWP 100153)]
0x000000000040bb39 in acquire_device_for_read (dcr=0x5d0028) at 
acquire.c:269
269              ASSERT(0);
Current language:  auto; currently c++
(gdb) up
#1  0x000000000042c958 in mount_next_read_volume (dcr=0x5d0028) at 
mount.c:790
790           if (!acquire_device_for_read(dcr)) {
(gdb) do
#0  0x000000000040bb39 in acquire_device_for_read (dcr=0x5d0028) at 
acquire.c:269
269              ASSERT(0);
(gdb) bt
#0  0x000000000040bb39 in acquire_device_for_read (dcr=0x5d0028) at 
acquire.c:269
#1  0x000000000042c958 in mount_next_read_volume (dcr=0x5d0028) at 
mount.c:790
#2  0x000000000042f2ab in read_records (dcr=0x5d0028, record_cb=0x42ee40 
<record_cb>, mount_cb=0x42c8b0 <mount_next_read_volume(DCR*)>) at 
read_record.c:86
#3  0x000000000042edd5 in do_read_data (jcr=0x5dec28) at read.c:86
#4  0x0000000000423568 in read_data_cmd (jcr=0x5dec28) at fd_cmds.c:280
#5  0x0000000000423099 in do_fd_commands (jcr=0x5dec28) at fd_cmds.c:165
#6  0x0000000000422ee3 in run_job (jcr=0x5dec28) at fd_cmds.c:128
#7  0x000000000042471c in run_cmd (jcr=0x5dec28) at job.c:210
#8  0x000000000041d5bd in handle_connection_request (arg=0x5bca28) at 
dircmd.c:232
#9  0x0000000000461753 in workq_server (arg=0x58de00) at workq.c:357
#10 0x00000008007d36e9 in pthread_create () from /lib/libpthread.so.2
#11 0x00000008013eae04 in makecontext () from /lib/libc.so.6
#12 0x0000000000000000 in ?? ()
#13 0x00000000005de400 in ?? ()
#14 0x00000000004614f0 in workq_remove () at workq.c:288


(gdb) info all
rax            0x0      0
rbx            0x5b8fc0 6000576
rcx            0x4      4
rdx            0x5b8028 5996584
rsi            0x7fffff3f8ecc   140737475743436
rdi            0x7fffff3f8ec0   140737475743424
rbp            0x7fffff3fa5a0   0x7fffff3fa5a0
rsp            0x7fffff3fa410   0x7fffff3fa410
r8             0x30e    782
r9             0x0      0
r10            0x0      0
r11            0x0      0
r12            0x5dec28 6155304
r13            0x0      0
r14            0x0      0
r15            0x23     35
rip            0x40bb39 0x40bb39 <acquire_device_for_read(DCR*)+3177>
eflags         0x10202  66050
cs             0x2b     43
ss             0x23     35
ds             0x0      0
es             0x0      0
fs             0x0      0
gs             0x0      0
st0            0        (raw 0x00000000000000000000)
st1            0        (raw 0x00000000000000000000)
st2            0        (raw 0x00000000000000000000)
st3            0        (raw 0x00000000000000000000)
st4            0        (raw 0x00000000000000000000)
st5            0        (raw 0x00000000000000000000)
st6            0        (raw 0x00000000000000000000)
st7            0        (raw 0x00000000000000000000)
fctrl          0x37f    895
fstat          0x0      0
ftag           0xffff   65535
fiseg          0x0      0
fioff          0x0      0
foseg          0x0      0
fooff          0x0      0
fop            0x0      0
xmm0           {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm1           {f = {0x0, 0x4, 0x0, 0x0}}       {f = {0, 4.5, 0, 0}}
xmm2           {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm3           {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm4           {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm5           {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm6           {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm7           {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm8           {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm9           {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm10          {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm11          {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm12          {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm13          {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm14          {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
xmm15          {f = {0x0, 0x0, 0x0, 0x0}}       {f = {0, 0, 0, 0}}
mxcsr          0x1f80   8064


(gdb) thread apply all bt

Thread 5 (Thread 0x5de400 (LWP 100153)):
#0  0x000000000040bb39 in acquire_device_for_read (dcr=0x5d0028) at 
acquire.c:269
#1  0x000000000042c958 in mount_next_read_volume (dcr=0x5d0028) at 
mount.c:790
#2  0x000000000042f2ab in read_records (dcr=0x5d0028, record_cb=0x42ee40 
<record_cb>, mount_cb=0x42c8b0 <mount_next_read_volume(DCR*)>) at 
read_record.c:86
#3  0x000000000042edd5 in do_read_data (jcr=0x5dec28) at read.c:86
#4  0x0000000000423568 in read_data_cmd (jcr=0x5dec28) at fd_cmds.c:280
#5  0x0000000000423099 in do_fd_commands (jcr=0x5dec28) at fd_cmds.c:165
#6  0x0000000000422ee3 in run_job (jcr=0x5dec28) at fd_cmds.c:128
#7  0x000000000042471c in run_cmd (jcr=0x5dec28) at job.c:210
#8  0x000000000041d5bd in handle_connection_request (arg=0x5bca28) at 
dircmd.c:232
#9  0x0000000000461753 in workq_server (arg=0x58de00) at workq.c:357
#10 0x00000008007d36e9 in pthread_create () from /lib/libpthread.so.2
#11 0x00000008013eae04 in makecontext () from /lib/libc.so.6
#12 0x0000000000000000 in ?? ()
#13 0x00000000005de400 in ?? ()
#14 0x00000000004614f0 in workq_remove () at workq.c:288

Thread 4 (LWP 100226):
#0  0x000000000040bb39 in acquire_device_for_read (dcr=0x5d0028) at 
acquire.c:269
#1  0x000000000042c958 in mount_next_read_volume (dcr=0x5d0028) at 
mount.c:790
#2  0x000000000042f2ab in read_records (dcr=0x5d0028, record_cb=0x42ee40 
<record_cb>, mount_cb=0x42c8b0 <mount_next_read_volume(DCR*)>) at 
read_record.c:86
#3  0x000000000042edd5 in do_read_data (jcr=0x5dec28) at read.c:86
#4  0x0000000000423568 in read_data_cmd (jcr=0x5dec28) at fd_cmds.c:280
#5  0x0000000000423099 in do_fd_commands (jcr=0x5dec28) at fd_cmds.c:165
#6  0x0000000000422ee3 in run_job (jcr=0x5dec28) at fd_cmds.c:128
#7  0x000000000042471c in run_cmd (jcr=0x5dec28) at job.c:210
#8  0x000000000041d5bd in handle_connection_request (arg=0x5bca28) at 
dircmd.c:232
#9  0x0000000000461753 in workq_server (arg=0x58de00) at workq.c:357
#10 0x00000008007d36e9 in pthread_create () from /lib/libpthread.so.2
#11 0x00000008013eae04 in makecontext () from /lib/libc.so.6
#12 0x0000000000000000 in ?? ()
#13 0x00000000005de400 in ?? ()
#14 0x00000000004614f0 in workq_remove () at workq.c:288

Thread 3 (Thread 0x59a000 (runnable)):
#0  0x000000080147fe8c in select () from /lib/libc.so.6
#1  0x00000008007cb47d in select () from /lib/libpthread.so.2
#2  0x00000000004409c6 in bnet_thread_server (addrs=0x590928, 
max_clients=41, client_wq=0x58de00,
     handle_client_request=0x41cfb0 <handle_connection_request(void*)>) 
at bnet_server.c:161
#3  0x0000000000406869 in main (argc=0, argv=0x7fffffffe810) at stored.c:264

Thread 2 (Thread 0x5bd000 (LWP 100150)):
#0  0x00000008007e1eec in pthread_testcancel () from /lib/libpthread.so.2
#1  0x0000000000000000 in ?? ()
#2  0x0000000000000000 in ?? ()
#3  0x000000000000001e in ?? ()
#4  0x0000000000000000 in ?? ()
#5  0x00000000005bd000 in ?? ()
#6  0x00000000005bd000 in ?? ()
#7  0x000000000059a000 in ?? ()
#8  0x00000008007da47a in pthread_mutexattr_init () from 
/lib/libpthread.so.2
#9  0x0000000000000000 in ?? ()
Error accessing memory address 0x7fffffbff000: Bad address.
0x000000000040bb39      269              ASSERT(0);




I guess I should really file that bug report, but I'm at a loss as to how to 
describe this in detail.



  bye & Thanks
        av.

-------------------------------------------------------------------------
This SF.Net email is sponsored by the Moblin Your Move Developer's challenge
Build the coolest Linux based applications with Moblin SDK & win great prizes
Grand prize is a trip for two to an Open Source event anywhere in the world
http://moblin-contest.org/redirect.php?banner_id=100&url=/
_______________________________________________
Bacula-users mailing list
Bacula-users AT lists.sourceforge DOT net
https://lists.sourceforge.net/lists/listinfo/bacula-users