Forum OpenACS Q&A: Re: naviserver signal 11 core backtrace

Collapse
Posted by Marty Israelsen on

We just received another core dump. This one is different from the first: the core file was only 9 GB, rather than the 22 GB of the first core file.

Also, its backtrace is different as well. Any insights you might be able to provide would be much appreciated.

Thanks,

Marty

[Thread debugging using libthread_db enabled]
Using host libthread_db library "/lib/x86_64-linux-gnu/libthread_db.so.1".
--Type <RET> for more, q to quit, c to continue without paging--
Core was generated by `/usr/local/ns/bin/nsd -u root -g web -i -t /web/etc/config.tcl'.
Program terminated with signal SIGSEGV, Segmentation fault.
#0  __GI_abort () at abort.c:107
107     abort.c: No such file or directory.
[Current thread is 1 (Thread 0x7f0f25ffb700 (LWP 88))]
(gdb) bt full
#0  __GI_abort () at abort.c:107
        act = {__sigaction_handler = {sa_handler = 0x0, sa_sigaction = 0x0}, sa_mask = {__val = {18446744073709551615 <repeats 16 times>}}, sa_flags = 0,
          sa_restorer = 0x0}
        sigs = {__val = {32, 0 <repeats 15 times>}}
#1  0x00007f106e4b3064 in skgdbgcra () from /opt/oracle/instantclient_21_1/libclntsh.so.21.1
No symbol table info available.
#2  0x00007f106e480693 in skgesigCrash () from /opt/oracle/instantclient_21_1/libclntsh.so.21.1
No symbol table info available.
#3  0x00007f106e4809de in skgesig_sigactionHandler () from /opt/oracle/instantclient_21_1/libclntsh.so.21.1
No symbol table info available.
#4  <signal handler called>
No locals.
#5  __GI_raise (sig=sig@entry=6) at ../sysdeps/unix/sysv/linux/raise.c:50
        set = {__val = {21511, 80, 139703038744752, 8657047456, 139702468349856, 139702401236992, 80, 7011059030223806464, 139708720069238, 139708720069238,
            139703038744960, 139708723414222, 0, 24, 139702468349856, 139703139720792}}
        pid = <optimized out>
        tid = <optimized out>
        ret = <optimized out>
#6  0x00007f1078af5859 in __GI_abort () at abort.c:79
        save_stage = 1
        act = {__sigaction_handler = {sa_handler = 0x55befb7066c0, sa_sigaction = 0x55befb7066c0}, sa_mask = {__val = {139702468349584, 139703038745072, 1, 0,
              139703139720784, 0, 139702468349856, 0, 7011059030223806464, 139703038745152, 139708723406150, 40, 139703038745184, 139708724032495,
              12884901888, 139703139720784}}, sa_flags = 67112592, sa_restorer = 0x7f1078a1ba76}
        sigs = {__val = {32, 0 <repeats 15 times>}}
#7  0x00007f1078d4a995 in Panic (fmt=0x7f1078de33ef "received fatal signal %d") at log.c:943
        ap = {{gp_offset = 8, fp_offset = 48, overflow_arg_area = 0x7f0f25ff9b40, reg_save_area = 0x7f0f25ff9a80}}
#8  0x00007f10789bef8d in Tcl_PanicVA (format=<optimized out>, argList=argList@entry=0x7f0f25ff9b80) at /usr/local/src/tcl8.6.11/generic/tclPanic.c:99
        arg1 = 0xb <error: Cannot access memory at address 0xb>
        arg2 = 0x0
        arg3 = 0x7f1078b1603b <__GI_raise+203> "H\213\204$\b\001"
        arg4 = 0x0
        arg5 = 0x7f0f25ff9800 "\aT"
        arg6 = 0x246 <error: Cannot access memory at address 0x246>
        arg7 = 0xbffffffff <error: Cannot access memory at address 0xbffffffff>
        arg8 = 0x0
#9  0x00007f10789bf0ff in Tcl_Panic (format=<optimized out>) at /usr/local/src/tcl8.6.11/generic/tclPanic.c:160
        argList = {{gp_offset = 48, fp_offset = 48, overflow_arg_area = 0x7f0f25ff9c78, reg_save_area = 0x7f0f25ff9ba0}}
#10 0x00007f1078db491b in Abort (signal=11) at unix.c:1119
No locals.
#11 <signal handler called>
No locals.
#12 0x00007f10783d940e in __pthread_rwlock_rdlock_full (abstime=0x0, clockid=0, rwlock=0x7f1078a1ba76) at pthread_rwlock_common.c:353
        r = <optimized out>
        wpf = <optimized out>
        ready = <optimized out>
        r = <optimized out>
        wpf = <optimized out>
        ready = <optimized out>
        __value = <optimized out>
        private = <optimized out>
        err = <optimized out>
        private = <optimized out>
        private = <optimized out>
        err = <optimized out>
#13 __GI___pthread_rwlock_rdlock (rwlock=0x7f1078a1ba76) at pthread_rwlock_rdlock.c:27
        result = <optimized out>
#14 0x00007f1078a7399d in Ns_RWLockRdLock (rwPtr=0x7f1078a65c90 <cmds+16>) at rwlock.c:355
        lockPtr = 0x7f1078a1ba76
        err = 16
        busy = true
        __PRETTY_FUNCTION__ = "Ns_RWLockRdLock"
--Type <RET> for more, q to quit, c to continue without paging--
#15 0x00007f1078d821c1 in UpdateInterp (itPtr=0x7f0e9c706f40) at tclinit.c:2278
        servPtr = 0x7f1078a65980 <tclVarHashKeyType>
        result = 0
        epoch = -1670353088
        scriptLength = 0
        script = 0x0
        doUpdateNow = false
        __PRETTY_FUNCTION__ = "UpdateInterp"
#16 0x00007f1078d81c97 in PopInterp (servPtr=0x7f1078a65980 <tclVarHashKeyType>, interp=0x7f10603fbbe0) at tclinit.c:1964
        itPtr = 0x7f0e9c706f40
        hPtr = 0x7f0e5818f3f0
        lock = 0x0
#17 0x00007f1078d7ff35 in NsTclAllocateInterp (servPtr=0x7f1078a65980 <tclVarHashKeyType>) at tclinit.c:503
        itPtr = 0x7f104a7fb37f
#18 0x00007f1078d2622e in NsTclConnChanProc (UNUSED_sock=10, arg=0x7f0dcd43f840, why=1) at connchan.c:601
        interp = 0x7f0f0400d9b0
        w = 0x7f1078dc07d6 "r"
        localsock = 3
        result = 0
        script = {string = 0x7f0f25ffab40 "::revproxy::spool conn829545 conn829544 client {-timeout 0 -sendtimeout 0.0 -receivetimeout 0.5} 0 r",
          length = 100, spaceAvl = 200,
          staticSpace = "::revproxy::spool conn829545 conn829544 client {-timeout 0 -sendtimeout 0.0 -receivetimeout 0.5} 0 r\000_n.js?u\005\000\000\000id=313895 {-tim\000\020\254\377%\017\177\000\000|\243\324x\020\177\000\000ut 0.0 -0\254\377%\017\177\000\000\266i\335x\020\177\000\000\300\254\377%\005\000\000\000\200\254\377%\017\177\000\000\066U\247x\020\177\000\000\060 r\000\060\000\000"}
        channelName = 0x0
        logEnabled = false
        scriptCmdNameLength = 0
        whenBuffer = "r\000\000\000\000"
        servPtr = 0x7f1078a65980 <tclVarHashKeyType>
        cbPtr = 0x7f0dcd43f840
        success = true
        __PRETTY_FUNCTION__ = "NsTclConnChanProc"
#19 0x00007f1078d69aba in SockCallbackThread (UNUSED_arg=0x0) at sockcallback.c:531
        stop = false
        pollTimeout = 30000
        nfds = 4
        now = {sec = 1650320393, usec = 649423}
        diff = {sec = 0, usec = 0}
        c = 0 '\000'
        when = {1, 2, 20}
        events = {1, 4, 2}
        n = 2
        i = 0
        isNew = 0
        maxPollfds = 100
        cbPtr = 0x7f0dccfa65a0
        nextPtr = 0x0
        hPtr = 0x7f0f5809dc30
        search = {tablePtr = 0x7f1078e0d800 <activeCallbacks>, nextIndex = 5, nextEntryPtr = 0x0}
        pfds = 0x7f0f040012b0
#20 0x00007f1078a74538 in NsThreadMain (arg=0x7f1031b4af90) at thread.c:232
        thrPtr = 0x7f1031b4af90
#21 0x00007f1078a762b7 in ThreadMain (arg=0x7f1031b4af90) at pthread.c:870
No locals.
#22 0x00007f10783d4609 in start_thread (arg=<optimized out>) at pthread_create.c:477
        ret = <optimized out>
        pd = <optimized out>
        unwind_buf = {cancel_jmp_buf = {{jmp_buf = {139703038752512, 1689291541696144044, 139707946087294, 139707946087295, 139707946087488, 139703038750464,
                -1625840922042375508, -1634417650425863508}, mask_was_saved = 0}}, priv = {pad = {0x0, 0x0, 0x0, 0x0}, data = {prev = 0x0, cleanup = 0x0,
              canceltype = 0}}}
        not_first_call = 0
--Type <RET> for more, q to quit, c to continue without paging--
#23 0x00007f1078bf2163 in clone () at ../sysdeps/unix/sysv/linux/x86_64/clone.S:95
No locals.
​​​​​​​