FYI I'm still seeing occasional disk:tls-duplicate-job-test failures on 
my Ubuntu 8.04 LTS regression test box. I've seen 3 failures in the past 
week.
http://regress.bacula.org/testDetails.php?test=541765&build=7356

I know that this is suspected to be a problem in the OpenSSL libraries 
but I vaguely remember (cannot find the email referencing it at the 
moment) that a workaround has been put into the Bacula sources. If so, 
then the workaround isn't 100% successful. If not, then please treat this 
as a throwaway message.

Thanks for everyone's hard work on Bacula.

Regards

Richard


I didn't get a traceback today but here is one from a week ago. Same 
symptoms as before in Thread 3.

-------- Original Message --------
Subject: Bacula GDB traceback of bacula-sd on royalcounty
Date: Tue, 01 Feb 2011 06:14:27 +0000 (GMT)
From: ri...@oldelvet.org.uk
To: ri...@oldelvet.org.uk

[Thread debugging using libthread_db enabled]
[New Thread 0x7fcc4585a700 (LWP 1605)]
[New Thread 0x7fcc46a69700 (LWP 1603)]
[New Thread 0x7fcc46268700 (LWP 32532)]
[New Thread 0x7fcc4726a700 (LWP 32528)]
0x00007fcc47563ff3 in select () from /lib/libc.so.6
$1 = '\000' <repeats 29 times>
$2 = 0x1565088 "bacula-sd"
$3 = 0x15650c8 "/home/regress/bacula/regress/bin/bacula-sd"
$4 = 0x0
$5 = 0x7fcc48e285fb "5.1.10 (26 January 2011)"
$6 = 0x7fcc48e28621 "x86_64-unknown-linux-gnu"
$7 = 0x7fcc48e2863a "ubuntu"
$8 = 0x7fcc48e2861b "10.04"
$9 = "royalcounty", '\000' <repeats 38 times>
$10 = 0x7fcc48e28614 "ubuntu 10.04"
$11 = 0
TestName = duplicate-job-test
#0  0x00007fcc47563ff3 in select () from /lib/libc.so.6
#1  0x00007fcc48df3f54 in bnet_thread_server (addrs=<value optimized out>,
     max_clients=<value optimized out>, client_wq=<value optimized out>,
     handle_client_request=<value optimized out>) at bnet_server.c:161
#2  0x00000000004084ea in main (argc=<value optimized out>,
     argv=<value optimized out>) at stored.c:313

Thread 5 (Thread 0x7fcc4726a700 (LWP 32528)):
#0  0x00007fcc489b611d in nanosleep () from /lib/libpthread.so.0
#1  0x00007fcc48df14e7 in bmicrosleep (sec=30, usec=0) at bsys.c:63
#2  0x00007fcc48e222db in check_deadlock () at lockmgr.c:574
#3  0x00007fcc489ad9ca in start_thread () from /lib/libpthread.so.0
#4  0x00007fcc4756b70d in clone () from /lib/libc.so.6
#5  0x0000000000000000 in ?? ()

Thread 4 (Thread 0x7fcc46268700 (LWP 32532)):
#0  0x00007fcc489b2bc9 in pthread_cond_timedwait@@GLIBC_2.3.2 ()
    from /lib/libpthread.so.0
#1  0x00007fcc48e21270 in bthread_cond_timedwait_p (cond=0x7fcc490379c0,
     m=0x7fcc49037980, abstime=0x7fcc46267da0,
     file=0x7fcc48e2b772 "watchdog.c", line=321) at lockmgr.c:824
#2  0x00007fcc48e1c358 in watchdog_thread (arg=<value optimized out>)
     at watchdog.c:321
#3  0x00007fcc48e22222 in lmgr_thread_launcher (x=<value optimized out>)
     at lockmgr.c:939
#4  0x00007fcc489ad9ca in start_thread () from /lib/libpthread.so.0
#5  0x00007fcc4756b70d in clone () from /lib/libc.so.6
#6  0x0000000000000000 in ?? ()

Thread 3 (Thread 0x7fcc46a69700 (LWP 1603)):
#0  0x00007fcc489b648d in waitpid () from /lib/libpthread.so.0
#1  0x00007fcc48e122ba in signal_handler (sig=11) at signal.c:229
#2  <signal handler called>
#3  0x00007fcc48bca680 in deflate_slow (s=0x1652a30,
     flush=<value optimized out>) at deflate.c:1612
#4  0x00007fcc48bc9281 in deflate (strm=0x17b7c10, flush=2) at deflate.c:822
#5  0x00007fcc480d0a52 in zlib_stateful_compress_block (
     ctx=<value optimized out>,
     out=0x158ce9a 
"D\265\272{'\001w\201\231\367\216\371\037\212I,\213\344\307\357\326n\210Q\204\372_\300\236\265\271\203\355\071\344W\200\366\274\034\005e,\317\374\306\342\231\252&n\243\325\332\312\070\331t\341NZ\315\345>\302\203I\372W\032\252\214M\346\303[[\316\233\255\216\035:(Y\002\273w\314?k\261\263\354sMf\245\062\006\351\226\067\210eJ\v\314:!",
 
olen=17408, in=0x1660c7c "", ilen=4)
     at c_zlib.c:207
#6  0x00007fcc480cfe10 in COMP_compress_block (ctx=0x3166,
     out=0xdc1 <Address 0xdc1 out of bounds>, olen=-71945882, 
in=0x1800f70 "",
     ilen=4) at comp_lib.c:46
#7  0x00007fcc48369fae in ssl3_do_compress (ssl=<value optimized out>)
     at s3_pkt.c:498
#8  0x00007fcc4836a0ee in do_ssl3_write (s=0x15a4a40, type=23,
     buf=0x1660c7c "", len=4, create_empty_fragment=0) at s3_pkt.c:659
#9  0x00007fcc4836a606 in ssl3_write_bytes (s=0x15a4a40,
     type=<value optimized out>, buf_=0x1660c7c, len=<value optimized out>)
     at s3_pkt.c:543
#10 0x00007fcc48e13fae in openssl_bsock_readwrite (bsock=0x1702bd8,
     ptr=0x1660c7c "", nbytes=4) at tls.c:626
#11 tls_bsock_writen (bsock=0x1702bd8, ptr=0x1660c7c "", nbytes=4) at 
tls.c:704
#12 0x00007fcc48df2f43 in write_nbytes (bsock=0x3166, ptr=0x1660c7c "",
     nbytes=4) at bnet.c:131
#13 0x00007fcc48df6996 in BSOCK::send (this=0x1702bd8) at bsock.c:379
#14 0x000000000041f424 in handle_connection_request (arg=0x1702bd8)
     at dircmd.c:251
#15 0x00007fcc48e1c80d in workq_server (arg=<value optimized out>)
     at workq.c:346
#16 0x00007fcc48e22222 in lmgr_thread_launcher (x=<value optimized out>)
     at lockmgr.c:939
#17 0x00007fcc489ad9ca in start_thread () from /lib/libpthread.so.0
#18 0x00007fcc4756b70d in clone () from /lib/libc.so.6
#19 0x0000000000000000 in ?? ()

Thread 2 (Thread 0x7fcc4585a700 (LWP 1605)):
#0  0x00007fcc48bca8fb in deflate_slow (s=0x1652a30,
     flush=<value optimized out>) at deflate.c:1666
#1  0x00007fcc48bc9281 in deflate (strm=0x17b7c10, flush=2) at deflate.c:822
#2  0x00007fcc480d0a52 in zlib_stateful_compress_block (
     ctx=<value optimized out>,
     out=0x158cdda 
"\357\224\327\247\065\335\202E+\272F\243\271`KO\021\310\233^\355\331v\th~\252\306\222\032\232\211\251\021tq\247\255\324$\262\255\242(Y\270\023\035\264d\241W\276\070\003m\214Jx\315\030J\345\366\376l&\205\232Jh\343\374\323\275\206$\017\207\324\016\035]V\226\217\363\262\277\330\325\253\253=\276\326-\335\t\207\022\254k\345\060\245t\021\251\065\230\352\202~v\232\024\071Q\353\336[P\216+\205\272",
 
olen=17408, in=0x1660c7c "", ilen=198) at c_zlib.c:207
#3  0x00007fcc480cfe10 in COMP_compress_block (ctx=0x216, out=0x1810f80 "",
     olen=232424529, in=0x1820f90 "\026\002", ilen=198) at comp_lib.c:46
#4  0x00007fcc48369fae in ssl3_do_compress (ssl=<value optimized out>)
     at s3_pkt.c:498
#5  0x00007fcc4836a0ee in do_ssl3_write (s=0x15a4a40, type=23,
     buf=0x1660c7c "", len=198, create_empty_fragment=0) at s3_pkt.c:659
#6  0x00007fcc4836a606 in ssl3_write_bytes (s=0x15a4a40,
     type=<value optimized out>, buf_=0x1660c7c, len=<value optimized out>)
     at s3_pkt.c:543
#7  0x00007fcc48e13fae in openssl_bsock_readwrite (bsock=0x1702bd8,
     ptr=0x1660c7c "", nbytes=198) at tls.c:626
#8  tls_bsock_writen (bsock=0x1702bd8, ptr=0x1660c7c "", nbytes=198)
     at tls.c:704
#9  0x00007fcc48df2f43 in write_nbytes (bsock=0x216, ptr=0x1660c7c "",
     nbytes=198) at bnet.c:131
#10 0x00007fcc48df6996 in BSOCK::send (this=0x1702bd8) at bsock.c:379
#11 0x00007fcc48df6d33 in BSOCK::fsend (this=0x1702bd8,
     fmt=0x7fcc48e289b8 "Jmsg Job=%s type=%d level=%lld %s") at bsock.c:434
#12 0x00007fcc48e07af1 in dispatch_message (jcr=<value optimized out>,
     type=<value optimized out>, mtime=1296540805, msg=<value optimized 
out>)
     at message.c:882
#13 0x00007fcc48e08560 in Jmsg (jcr=0x158c408, type=6, mtime=0,
     fmt=0x4428a0 "JobId=%d Job=\"%s\" marked to be canceled.\n")
     at message.c:1290
#14 0x000000000041ec65 in cancel_cmd (cjcr=<value optimized out>)
     at dircmd.c:344
#15 0x000000000041f537 in handle_connection_request (arg=0x15a1498)
     at dircmd.c:233
#16 0x00007fcc48e1c80d in workq_server (arg=<value optimized out>)
     at workq.c:346
#17 0x00007fcc48e22222 in lmgr_thread_launcher (x=<value optimized out>)
     at lockmgr.c:939
#18 0x00007fcc489ad9ca in start_thread () from /lib/libpthread.so.0
#19 0x00007fcc4756b70d in clone () from /lib/libc.so.6
#20 0x0000000000000000 in ?? ()

Thread 1 (Thread 0x7fcc49649720 (LWP 32526)):
#0  0x00007fcc47563ff3 in select () from /lib/libc.so.6
#1  0x00007fcc48df3f54 in bnet_thread_server (addrs=<value optimized out>,
     max_clients=<value optimized out>, client_wq=<value optimized out>,
     handle_client_request=<value optimized out>) at bnet_server.c:161
#2  0x00000000004084ea in main (argc=<value optimized out>,
     argv=<value optimized out>) at stored.c:313
#0  0x00007fcc47563ff3 in select () from /lib/libc.so.6
No symbol table info available.
#1  0x00007fcc48df3f54 in bnet_thread_server (addrs=<value optimized out>,
     max_clients=<value optimized out>, client_wq=<value optimized out>,
     handle_client_request=<value optimized out>) at bnet_server.c:161
warning: Source file is more recent than executable.
161           if ((stat = select(maxfd + 1, &sockset, NULL, NULL, NULL)) < 0) {
maxfd = 3
sockset = {fds_bits = {8, 0 <repeats 15 times>}}
clilen = 16
turnon = 1
p = <value optimized out>
buf = "127.0.0.1\000\000\000\000\000\000\000\370\004e", '\000' <repeats 
37 times>"\221, \027EI\314\177\000\000\005", '\000' <repeats 15 times>, 
"r\267\342H\314\177\000\000\b(\336H\314\177\000\000\000\000\000\000\000\000\000\000\260L:\364\377\177\000\000$\000\000\000\000\000\000\000\001\000\000\000\000\000\000"
allbuf = 
"\273;\017H\314\177\000\000N\001\000\000\000\000\000\000\360GX\001\000\000\000\000\003\000\000\000\000\000\000\000\273;\017H\314\177\000\000\003\000\000\000\000\000\000\000P\000\000\000\000\000\000\000\003\000\000\000\000\000\000\000\225.X\001\000\000\000\000\002\000\000\000\314\177\000\000@\000\000\000\000\000\000\000\002\000\000\000\314\177\000\000@\000\000\000\000\000\000\000\002\000\000\000\000\000\000\000\020]X\001\000\000\000\000@>\200G\314\177\000\000\273;\017H\314\177\000\000@>\200G\314\177\000\000!R\017H\314\177\000\000\n\000\000\000\000\000\000\000\215.X\001\000\000\000\000\060]X\001\000\000\000\000\v\000\000\000\000\000\000\000\216\025PG\314\177\000\000\273;\017H\314\177\000\000N\001\000\000\000\000\000\000\020]X\001\000\000\000\000\003\000\000\000\000\000\000\000\273"...
stat = <value optimized out>
tlog = <value optimized out>
fd_ptr = 0x0
sockfds = {<SMARTALLOC> = {<No data fields>}, head = 0x7ffff43a3be0,
   tail = 0x7ffff43a3be0, loffset = 0, num_items = 1}
newsockfd = <value optimized out>
cli_addr = {sa_family = 2,
   sa_data = "\265\216\177\000\000\001\000\000\000\000\000\000\000"}
request = {fd = 5, user = '\000' <repeats 127 times>,
   daemon = "localhost-sd", '\000' <repeats 115 times>,
   pid = "32526\000\000\000\000", client = {{name = '\000' <repeats 127 
times>,
       addr = '\000' <repeats 127 times>, sin = 0x7fcc487a1b20, unit = 0x0,
       request = 0x7ffff43a4720}}, server = {{
       name = '\000' <repeats 127 times>, addr = '\000' <repeats 127 
times>,
       sin = 0x7fcc487a1aa0, unit = 0x0, request = 0x7ffff43a4720}}, 
sink = 0,
   hostname = 0x7fcc4859e3d0 <sock_hostname>,
   hostaddr = 0x7fcc4859e1b0 <sock_hostaddr>, cleanup = 0, config = 0x0}
#2  0x00000000004084ea in main (argc=<value optimized out>,
     argv=<value optimized out>) at stored.c:313
313                           &dird_workq, handle_connection_request);
test_config = false
ch = <value optimized out>
no_signals = false
thid = 140515335378688
uid = 0x0
gid = 0x0
#0  0x0000000000000000 in ?? ()
No symbol table info available.
#0  0x0000000000000000 in ?? ()
No symbol table info available.
#0  0x0000000000000000 in ?? ()
No symbol table info available.
#0  0x0000000000000000 in ?? ()
No symbol table info available.
#0  0x0000000000000000 in ?? ()
No symbol table info available.

------------------------------------------------------------------------------
The ultimate all-in-one performance toolkit: Intel(R) Parallel Studio XE:
Pinpoint memory and threading errors before they happen.
Find and fix more than 250 security defects in the development cycle.
Locate bottlenecks in serial and parallel code that limit performance.
http://p.sf.net/sfu/intel-dev2devfeb
_______________________________________________
Bacula-devel mailing list
Bacula-devel@lists.sourceforge.net
https://lists.sourceforge.net/lists/listinfo/bacula-devel

Reply via email to