You are viewing a plain text version of this content. The canonical link for it is here.
Posted to issues@trafficserver.apache.org by "hu xiao (JIRA)" <ji...@apache.org> on 2013/03/21 15:11:15 UTC

[jira] [Commented] (TS-1759) encounter Sig 11 while enabling cluster

    [ https://issues.apache.org/jira/browse/TS-1759?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=13608958#comment-13608958 ] 

hu xiao commented on TS-1759:
-----------------------------

With -O0, gdb trace:


(gdb) ptype
type = const class Ptr<ProxyMutex> {
  public:
    ProxyMutex *m_ptr;

    void Ptr(ProxyMutex *);
    void Ptr(const Ptr<ProxyMutex> &);
    ~Ptr(int);
    void clear();
    Ptr<ProxyMutex> & operator=(Ptr<ProxyMutex> const&);
    Ptr<ProxyMutex> & operator=(ProxyMutex*);
    ProxyMutex * to_ptr();
    operator ProxyMutex*() const;
    ProxyMutex * operator->() const;
    ProxyMutex & operator*() const;
    int operator==(ProxyMutex const*);
    int operator==(Ptr<ProxyMutex> const&);
    int operator!=(ProxyMutex const*);
    int operator!=(Ptr<ProxyMutex> const&);
    RefCountObj * _ptr();
} &
(gdb) bt
#0  0x00000000004cb524 in Ptr<ProxyMutex>::operator= (this=0x845e49748, src=@0x25d0) at Ptr.h:414
#1  0x00000000006badde in UnixNetVConnection::do_io_write (this=0x845e495a0, c=0x25b8, nbytes=0, reader=0x0, owner=false)
    at UnixNetVConnection.cc:549
#2  0x0000000000564927 in HttpServerSession::do_io_write (this=0x843b4bc60, c=0x25b8, nbytes=0, buf=0x0, owner=false)
    at HttpServerSession.cc:105
#3  0x0000000000566429 in HttpSessionManager::release_session (this=0x9ecf60, to_release=0x843b4bc60) at HttpSessionManager.cc:315
#4  0x0000000000564b5d in HttpServerSession::release (this=0x843b4bc60) at HttpServerSession.cc:173
#5  0x00000000005733d3 in HttpSM::tunnel_handler_server (this=0x846ac2350, event=102, p=0x846ac40d8) at HttpSM.cc:2893
#6  0x00000000005affa7 in HttpTunnel::producer_handler (this=0x846ac3ee0, event=102, p=0x846ac40d8) at HttpTunnel.cc:1161
#7  0x00000000005b0104 in HttpTunnel::main_handler (this=0x846ac3ee0, event=100, data=0x845e496a8) at HttpTunnel.cc:1477
#8  0x00000000005b041d in chunked_reenable (p=0x846ac40d8, tunnel=0x846ac3ee0) at HttpTunnel.cc:73
#9  0x00000000005b05d7 in HttpTunnel::consumer_handler (this=0x846ac3ee0, event=101, c=0x846ac3f88) at HttpTunnel.cc:1223
#10 0x00000000005b0136 in HttpTunnel::main_handler (this=0x846ac3ee0, event=101, data=0x846ff2320) at HttpTunnel.cc:1481
#11 0x00000000004e696f in Continuation::handleEvent (this=0x846ac3ee0, event=101, data=0x846ff2320) at I_Continuation.h:146
#12 0x000000000065b1cf in ClusterHandler::cluster_signal_and_update (this=0x816ca5500, event=101, vc=0x846ff2240, s=0x846ff2318)
    at ClusterHandlerBase.cc:594
#13 0x00000000006542e6 in ClusterHandler::valid_for_data_write (this=0x816ca5500, vc=0x846ff2240) at ClusterHandler.cc:2047
#14 0x000000000065467d in ClusterHandler::build_write_descriptors (this=0x816ca5500) at ClusterHandler.cc:1602
#15 0x0000000000654abc in ClusterHandler::process_write (this=0x816ca5500, now=1363869982166845120, only_write_control_msgs=false)
    at ClusterHandler.cc:2880
#16 0x0000000000655545 in ClusterHandler::mainClusterEvent (this=0x816ca5500, event=5, e=0x81c356f60) at ClusterHandler.cc:2507
#17 0x00000000004e696f in Continuation::handleEvent (this=0x816ca5500, event=5, data=0x81c356f60) at I_Continuation.h:146
#18 0x00000000006ddddc in EThread::process_event (this=0x843247000, e=0x81c356f60, calling_code=5) at UnixEThread.cc:142
#19 0x00000000006de27e in EThread::execute (this=0x843247000) at UnixEThread.cc:266
#20 0x00000000006dd729 in spawn_thread_internal (a=0x80512d070) at Thread.cc:88
#21 0x0000000800e1bd14 in pthread_getprio () from /lib/libthr.so.3
#22 0x0000000000000000 in ?? ()

                
> encounter Sig 11 while enabling cluster
> ---------------------------------------
>
>                 Key: TS-1759
>                 URL: https://issues.apache.org/jira/browse/TS-1759
>             Project: Traffic Server
>          Issue Type: Bug
>          Components: Clustering
>            Reporter: hu xiao
>
> I have two boxes running ATS, and they work normally when running separately. 
> But if clustering is enabled, they restart randomly, and " Sig 11 " appears in traffic.out.
> The core dump in gdb:
> Core was generated by `traffic_server'.
> Program terminated with signal 11, Segmentation fault.
> Reading symbols from /usr/local/trafficserver/lib/libtsutil.so.6...done.
> Loaded symbols for /usr/local/trafficserver/lib/libtsutil.so.6
> Reading symbols from /lib/libthr.so.3...done.
> Loaded symbols for /lib/libthr.so.3
> Reading symbols from /usr/lib/librt.so.1...done.
> Loaded symbols for /usr/lib/librt.so.1
> Reading symbols from /usr/local/lib/libpcre.so.3...done.
> Loaded symbols for /usr/local/lib/libpcre.so.3
> Reading symbols from /usr/lib/libssl.so.6...done.
> Loaded symbols for /usr/lib/libssl.so.6
> Reading symbols from /lib/libcrypto.so.6...done.
> Loaded symbols for /lib/libcrypto.so.6
> Reading symbols from /usr/local/lib/libtcl85.so.1...done.
> Loaded symbols for /usr/local/lib/libtcl85.so.1
> Reading symbols from /usr/local/lib/libexpat.so.6...done.
> Loaded symbols for /usr/local/lib/libexpat.so.6
> Reading symbols from /usr/local/lib/libiconv.so.3...done.
> Loaded symbols for /usr/local/lib/libiconv.so.3
> Reading symbols from /lib/libz.so.6...done.
> Loaded symbols for /lib/libz.so.6
> Reading symbols from /usr/lib/liblzma.so.5...done.
> Loaded symbols for /usr/lib/liblzma.so.5
> Reading symbols from /usr/local/lib/libexecinfo.so.1...done.
> Loaded symbols for /usr/local/lib/libexecinfo.so.1
> Reading symbols from /usr/lib/libstdc++.so.6...done.
> Loaded symbols for /usr/lib/libstdc++.so.6
> Reading symbols from /lib/libm.so.5...done.
> Loaded symbols for /lib/libm.so.5
> Reading symbols from /lib/libgcc_s.so.1...done.
> Loaded symbols for /lib/libgcc_s.so.1
> Reading symbols from /lib/libc.so.7...done.
> Loaded symbols for /lib/libc.so.7
> Reading symbols from /usr/lib/libsupc++.so.1...done.
> Loaded symbols for /usr/lib/libsupc++.so.1
> Reading symbols from /libexec/ld-elf.so.1...done.
> Loaded symbols for /libexec/ld-elf.so.1
> #0  UnixNetVConnection::do_io_write (this=0x81b5cc240, c=0xfab8, nbytes=0, reader=0x0, owner=false) at Ptr.h:414
> 414     Ptr.h: No such file or directory.
>         in Ptr.h
> [New Thread 8050e8c00 (LWP 100933/traffic_server)]
> [New Thread 8050e8800 (LWP 100932/traffic_server)]
> [New Thread 8050e8400 (LWP 100931/traffic_server)]
> [New Thread 8050e8000 (LWP 100930/traffic_server)]
> [New Thread 8050e7c00 (LWP 100929/traffic_server)]
> [New Thread 80380e400 (LWP 100928/traffic_server)]
> [New Thread 80380e000 (LWP 100927/traffic_server)]
> [New Thread 80380dc00 (LWP 100926/traffic_server)]
> [New Thread 80380d800 (LWP 100925/traffic_server)]
> [New Thread 80380d400 (LWP 100924/traffic_server)]
> [New Thread 80380d000 (LWP 100923/traffic_server)]
> [New Thread 80380cc00 (LWP 100922/traffic_server)]
> [New Thread 80380c800 (LWP 100921/traffic_server)]
> [New Thread 80380c400 (LWP 100920/traffic_server)]
> [New Thread 80380c000 (LWP 100919/traffic_server)]
> [New Thread 80380bc00 (LWP 100918/traffic_server)]
> [New Thread 80380b800 (LWP 100917/traffic_server)]
> [New Thread 80380b400 (LWP 100916/traffic_server)]
> [New Thread 80380b000 (LWP 100915/traffic_server)]
> [New Thread 80380ac00 (LWP 100914/traffic_server)]
> [New Thread 80380a800 (LWP 100882/traffic_server)]
> [New Thread 80380a400 (LWP 100881/traffic_server)]
> [New Thread 80380a000 (LWP 100877/traffic_server)]
> [New Thread 803809c00 (LWP 100875/traffic_server)]
> [New Thread 803809800 (LWP 100874/traffic_server)]
> [New Thread 803809400 (LWP 100873/traffic_server)]
> [New Thread 803809000 (LWP 100872/traffic_server)]
> [New Thread 803808c00 (LWP 100871/traffic_server)]
> [New Thread 803808800 (LWP 100870/traffic_server)]
> [New Thread 803808400 (LWP 100869/traffic_server)]
> [New Thread 803807800 (LWP 100867/traffic_server)]
> [New Thread 803807400 (LWP 100241/traffic_server)]
> (gdb) bt
> #0  UnixNetVConnection::do_io_write (this=0x81b5cc240, c=0xfab8, nbytes=0, reader=0x0, owner=false) at Ptr.h:414
> #1  0x0000000000526a71 in HttpSessionManager::release_session (this=0x9aad60, to_release=0x8036dd860) at HttpSessionManager.cc:309
> #2  0x000000000052ee22 in HttpSM::tunnel_handler_server (this=0x81b6c6e30, event=58905600, p=0x8036dd860) at HttpSM.cc:2893
> #3  0x000000000057d92c in HttpTunnel::producer_handler (this=0x81b6c89c0, event=102, p=0x81b6c8bb8) at HttpTunnel.cc:1161
> #4  0x000000000057deff in HttpTunnel::main_handler (this=0x81b6c89c0, event=<value optimized out>, data=<value optimized out>) at HttpTunnel.cc:1477
> #5  0x000000000057e251 in chunked_reenable (p=0x81b6c8bb8, tunnel=0x81b6c89c0) at HttpTunnel.cc:73
> #6  0x000000000057e42e in HttpTunnel::consumer_handler (this=0x81b6c89c0, event=101, c=0x81b6c8a68) at HttpTunnel.cc:1223
> #7  0x000000000057de5b in HttpTunnel::main_handler (this=0x81b6c89c0, event=<value optimized out>, data=<value optimized out>) at HttpTunnel.cc:1481
> #8  0x0000000000626473 in ClusterHandler::cluster_signal_and_update (this=0x84873d500, event=101, vc=0x844ed0500, s=<value optimized out>)
>     at I_Continuation.h:146
> #9  0x0000000000623b03 in ClusterHandler::valid_for_data_write (this=0x84873d500, vc=0x844ed0500) at ClusterHandler.cc:2047
> #10 0x00000000006243e8 in ClusterHandler::build_write_descriptors (this=0x84873d500) at ClusterHandler.cc:1602
> #11 0x0000000000624bfd in ClusterHandler::process_write (this=0x84873d500, now=1363698900503840961, only_write_control_msgs=false)
>     at ClusterHandler.cc:2880
> #12 0x0000000000624eb2 in ClusterHandler::mainClusterEvent (this=0x84873d500, event=<value optimized out>, e=0x81bce0000) at ClusterHandler.cc:2507
> #13 0x00000000006c6ae0 in EThread::process_event (this=0x846e88000, e=0x81bce0000, calling_code=5) at I_Continuation.h:146
> #14 0x00000000006c72ba in EThread::execute (this=0x846e88000) at UnixEThread.cc:266
> #15 0x00000000006c661a in spawn_thread_internal (a=0x80507a070) at Thread.cc:88
> #16 0x0000000800dc9d14 in pthread_getprio () from /lib/libthr.so.3
> #17 0x0000000000000000 in ?? ()
> # uname -a
> FreeBSD fw2 9.1-STABLE FreeBSD 9.1-STABLE #3 r248486: Tue Mar 19 11:39:02 CST 2013     root@mm.lsxedu.com:/usr/obj/usr/src/sys/JW  amd64

--
This message is automatically generated by JIRA.
If you think it was sent incorrectly, please contact your JIRA administrators
For more information on JIRA, see: http://www.atlassian.com/software/jira