• Type: Icon: Bug Bug
    • Resolution: Incomplete
    • Priority: Icon: Major - P3 Major - P3
    • None
    • Affects Version/s: None
    • Component/s: None
    • Labels:
      None
    • ALL

      I see a crash on my 3.0.5 WiredTiger server. Here is the relevant section of the log:

      2016-02-22T03:24:54.330+0000 F -        [ReplExecNetThread-1] Got signal: 6 (Aborted).
       
      0xf74fc9 0xf74642 0xf749f6 0x7f4f4e13a670 0x7f4f4e13a5f7 0x7f4f4e13bce8 0xdacd29 0x89421d 0x894e27 0x8671b7 0x88f2b6 0x84d3a1 0x853dee 0x84640d 0xc3a0ad 0xc3a5d4 0xc3ad8c 0xc3b39d 0xfc3104
      0x7f4f4f748dc5 0x7f4f4e1fbbdd
      ----- BEGIN BACKTRACE -----
      {"backtrace":[{"b":"400000","o":"B74FC9"},{"b":"400000","o":"B74642"},{"b":"400000","o":"B749F6"},{"b":"7F4F4E105000","o":"35670"},{"b":"7F4F4E105000","o":"355F7"},{"b":"7F4F4E105000","o":"3
      6CE8"},{"b":"400000","o":"9ACD29"},{"b":"400000","o":"49421D"},{"b":"400000","o":"494E27"},{"b":"400000","o":"4671B7"},{"b":"400000","o":"48F2B6"},{"b":"400000","o":"44D3A1"},{"b":"400000","
      o":"453DEE"},{"b":"400000","o":"44640D"},{"b":"400000","o":"83A0AD"},{"b":"400000","o":"83A5D4"},{"b":"400000","o":"83AD8C"},{"b":"400000","o":"83B39D"},{"b":"400000","o":"BC3104"},{"b":"7F4
      F4F741000","o":"7DC5"},{"b":"7F4F4E105000","o":"F6BDD"}],"processInfo":{ "mongodbVersion" : "3.0.5", "gitVersion" : "8bc4ae20708dbb493cb09338d9e7be6698e4a3a3", "uname" : { "sysname" : "Linux
      ", "release" : "3.10.37-47.135.amzn1.x86_64", "version" : "#1 SMP Fri Apr 18 03:28:26 UTC 2014", "machine" : "x86_64" }, "somap" : [ { "elfType" : 2, "b" : "400000", "buildId" : "F2642585C8D
      FF37F942ABBAF84DEA258651EC3C8" }, { "b" : "7FFF304DB000", "elfType" : 3, "buildId" : "A9D61CE6B4FC467291ED5B3AD5418A1F5DEA012E" }, { "b" : "7F4F4F741000", "path" : "/lib64/libpthread.so.0",
      "elfType" : 3, "buildId" : "E5E575776DAD20ADE8FD0CAF17897C9D89020A87" }, { "b" : "7F4F4F4D4000", "path" : "/usr/lib64/libssl.so.10", "elfType" : 3, "buildId" : "B949A1349FF0E93409055F00BFD60
      F758EE8FA02" }, { "b" : "7F4F4F0EF000", "path" : "/lib64/libcrypto.so.10", "elfType" : 3, "buildId" : "F444116328F54797379DAA3B0FD53CF6C829F22A" }, { "b" : "7F4F4EEE7000", "path" : "/lib64/l
      ibrt.so.1", "elfType" : 3, "buildId" : "42833B65941483A611C40EA7D32F56EA83EA6E93" }, { "b" : "7F4F4ECE3000", "path" : "/lib64/libdl.so.2", "elfType" : 3, "buildId" : "6335077ACD51527BE9F2F18
      451A88E2B7350C5B6" }, { "b" : "7F4F4E9DF000", "path" : "/usr/lib64/libstdc++.so.6", "elfType" : 3, "buildId" : "5E2AE3B2E1D3984B4DE32FE73D221D8C425516E5" }, { "b" : "7F4F4E6DD000", "path" :
      "/lib64/libm.so.6", "elfType" : 3, "buildId" : "BB312C4A65B8FD830C148612CBEACEACC8B08E4F" }, { "b" : "7F4F4E4C7000", "path" : "/lib64/libgcc_s.so.1", "elfType" : 3, "buildId" : "00FA2883FB47
      B1327397BBF167C52F51A723D013" }, { "b" : "7F4F4E105000", "path" : "/lib64/libc.so.6", "elfType" : 3, "buildId" : "D84E3AFDFF3E164A09C125F85B5DCABC6F545B5E" }, { "b" : "7F4F4F95D000", "path"
      : "/lib64/ld-linux-x86-64.so.2", "elfType" : 3, "buildId" : "7B7BF8FEEF1A9C627EF90CA5C9188EFD4DA2DDD2" }, { "b" : "7F4F4DEB9000", "path" : "/lib64/libgssapi_krb5.so.2", "elfType" : 3, "build
      Id" : "E203354E7F907ACC8C3028FE465541B666DCFBA0" }, { "b" : "7F4F4DBD4000", "path" : "/lib64/libkrb5.so.3", "elfType" : 3, "buildId" : "D769C8FFAF8772FDA55031ABF2E167DF2207E378" }, { "b" : "
      7F4F4D9D1000", "path" : "/usr/lib64/libcom_err.so.2", "elfType" : 3, "buildId" : "5C01209C5AE1B1714F19B07EB58F2A1274B69DC8" }, { "b" : "7F4F4D79F000", "path" : "/lib64/libk5crypto.so.3", "el
      fType" : 3, "buildId" : "6C2243D37143F7FD1E16ED1F6CE4D7F16C2D7EF1" }, { "b" : "7F4F4D589000", "path" : "/lib64/libz.so.1", "elfType" : 3, "buildId" : "89C6AF118B6B4FB6A73AE1813E2C8BDD722956D
      1" }, { "b" : "7F4F4D37A000", "path" : "/lib64/libkrb5support.so.0", "elfType" : 3, "buildId" : "744272FEAAABCE629AB9E11FAA4A96AEBE8BC2B4" }, { "b" : "7F4F4D177000", "path" : "/lib64/libkeyu
      tils.so.1", "elfType" : 3, "buildId" : "37A58210FA50C91E09387765408A92909468D25B" }, { "b" : "7F4F4CF5D000", "path" : "/lib64/libresolv.so.2", "elfType" : 3, "buildId" : "47EC2C63132D25E4FE8
      3F77023DA1A66457A88F1" }, { "b" : "7F4F4CD3C000", "path" : "/usr/lib64/libselinux.so.1", "elfType" : 3, "buildId" : "F5054DC94443326819FBF3065CFDF5E4726F57EE" } ] }}
       mongod(_ZN5mongo15printStackTraceERSo+0x29) [0xf74fc9]
       mongod(+0xB74642) [0xf74642]
       mongod(+0xB749F6) [0xf749f6]
       libc.so.6(+0x35670) [0x7f4f4e13a670]
       libc.so.6(gsignal+0x37) [0x7f4f4e13a5f7]
       libc.so.6(abort+0x148) [0x7f4f4e13bce8]
       mongod(_ZN5mongo12SecureRandom6createEv+0x1B9) [0xdacd29]
       mongod(_ZN5mongo31SaslSCRAMSHA1ClientConversation10_firstStepEPSs+0x16D) [0x89421d]
       mongod(_ZN5mongo31SaslSCRAMSHA1ClientConversation4stepERKNS_10StringDataEPSs+0x247) [0x894e27]
       mongod(_ZN5mongo23NativeSaslClientSession4stepERKNS_10StringDataEPSs+0x27) [0x8671b7]
       mongod(+0x48F2B6) [0x88f2b6]
       mongod(_ZN5mongo20DBClientWithCommands5_authERKNS_7BSONObjE+0x191) [0x84d3a1]
       mongod(_ZN5mongo18DBClientConnection5_authERKNS_7BSONObjE+0x16E) [0x853dee]
       mongod(_ZN5mongo20DBClientWithCommands4authERKNS_7BSONObjE+0x1D) [0x84640d]
       mongod(_ZN5mongo4repl20NetworkInterfaceImpl14ConnectionPool17acquireConnectionERKNS_11HostAndPortENS_6Date_tEN5boost9date_time18subsecond_durationINS7_10posix_time13time_durationELl1000EEE+
      0x26D) [0xc3a0ad]
       mongod(_ZN5mongo4repl20NetworkInterfaceImpl11_runCommandERKNS0_19ReplicationExecutor20RemoteCommandRequestE+0xC4) [0xc3a5d4]
       mongod(_ZN5mongo4repl20NetworkInterfaceImpl23_consumeNetworkRequestsEv+0x15C) [0xc3ad8c]
       mongod(_ZN5mongo4repl20NetworkInterfaceImpl27_requestProcessorThreadBodyEPS1_RKSs+0x8D) [0xc3b39d]
       mongod(+0xBC3104) [0xfc3104]
       libpthread.so.0(+0x7DC5) [0x7f4f4f748dc5]
       libc.so.6(clone+0x6D) [0x7f4f4e1fbbdd]
      -----  END BACKTRACE  -----
      

      Further down in the traces I see a similar stack, but with a different error:

      2016-02-22T21:07:53.557+0000 I NETWORK  [initandlisten] connection accepted from 10.178.82.244:36048 #8125 (4887 connections now open)
      2016-02-22T21:07:53.560+0000 I NETWORK  [initandlisten] connection accepted from 10.239.128.188:32840 #8126 (4888 connections now open)
      2016-02-22T21:07:53.577+0000 I NETWORK  [initandlisten] Listener: accept() returns -1 errno:24 Too many open files
      2016-02-22T21:07:53.577+0000 E NETWORK  [initandlisten] Out of file descriptors. Waiting one second before trying to accept more connections.
      2016-02-22T21:07:53.587+0000 F -        [conn8118] Got signal: 6 (Aborted).
      
       0xf74fc9 0xf74642 0xf749f6 0x7faddfbd8670 0x7faddfbd85f7 0x7faddfbd9ce8 0xdacd29 0x8ed8a2 0x8ee401 0x8c35e7 0x8e1ce7 0x8e37a6 0x9ced74 0x9cfcfd 0x9d0a0b 0xba1eea 0xab38d0 0x7fb82d 0xf2639b
      0x7fade11e6dc5 0x7faddfc99bdd
      ----- BEGIN BACKTRACE -----
      {"backtrace":[{"b":"400000","o":"B74FC9"},{"b":"400000","o":"B74642"},{"b":"400000","o":"B749F6"},{"b":"7FADDFBA3000","o":"35670"},{"b":"7FADDFBA3000","o":"355F7"},{"b":"7FADDFBA3000","o":"3
      6CE8"},{"b":"400000","o":"9ACD29"},{"b":"400000","o":"4ED8A2"},{"b":"400000","o":"4EE401"},{"b":"400000","o":"4C35E7"},{"b":"400000","o":"4E1CE7"},{"b":"400000","o":"4E37A6"},{"b":"400000","
      o":"5CED74"},{"b":"400000","o":"5CFCFD"},{"b":"400000","o":"5D0A0B"},{"b":"400000","o":"7A1EEA"},{"b":"400000","o":"6B38D0"},{"b":"400000","o":"3FB82D"},{"b":"400000","o":"B2639B"},{"b":"7FA
      DE11DF000","o":"7DC5"},{"b":"7FADDFBA3000","o":"F6BDD"}],"processInfo":{ "mongodbVersion" : "3.0.5", "gitVersion" : "8bc4ae20708dbb493cb09338d9e7be6698e4a3a3", "uname" : { "sysname" : "Linux
      ", "release" : "3.10.37-47.135.amzn1.x86_64", "version" : "#1 SMP Fri Apr 18 03:28:26 UTC 2014", "machine" : "x86_64" }, "somap" : [ { "elfType" : 2, "b" : "400000", "buildId" : "F2642585C8D
      FF37F942ABBAF84DEA258651EC3C8" }, { "b" : "7FFFE1AFE000", "elfType" : 3, "buildId" : "A9D61CE6B4FC467291ED5B3AD5418A1F5DEA012E" }, { "b" : "7FADE11DF000", "path" : "/lib64/libpthread.so.0",
      "elfType" : 3, "buildId" : "E5E575776DAD20ADE8FD0CAF17897C9D89020A87" }, { "b" : "7FADE0F72000", "path" : "/usr/lib64/libssl.so.10", "elfType" : 3, "buildId" : "B949A1349FF0E93409055F00BFD60
      F758EE8FA02" }, { "b" : "7FADE0B8D000", "path" : "/lib64/libcrypto.so.10", "elfType" : 3, "buildId" : "F444116328F54797379DAA3B0FD53CF6C829F22A" }, { "b" : "7FADE0985000", "path" : "/lib64/l
      ibrt.so.1", "elfType" : 3, "buildId" : "42833B65941483A611C40EA7D32F56EA83EA6E93" }, { "b" : "7FADE0781000", "path" : "/lib64/libdl.so.2", "elfType" : 3, "buildId" : "6335077ACD51527BE9F2F18
      451A88E2B7350C5B6" }, { "b" : "7FADE047D000", "path" : "/usr/lib64/libstdc++.so.6", "elfType" : 3, "buildId" : "5E2AE3B2E1D3984B4DE32FE73D221D8C425516E5" }, { "b" : "7FADE017B000", "path" :
      "/lib64/libm.so.6", "elfType" : 3, "buildId" : "BB312C4A65B8FD830C148612CBEACEACC8B08E4F" }, { "b" : "7FADDFF65000", "path" : "/lib64/libgcc_s.so.1", "elfType" : 3, "buildId" : "00FA2883FB47
      B1327397BBF167C52F51A723D013" }, { "b" : "7FADDFBA3000", "path" : "/lib64/libc.so.6", "elfType" : 3, "buildId" : "D84E3AFDFF3E164A09C125F85B5DCABC6F545B5E" }, { "b" : "7FADE13FB000", "path"
      : "/lib64/ld-linux-x86-64.so.2", "elfType" : 3, "buildId" : "7B7BF8FEEF1A9C627EF90CA5C9188EFD4DA2DDD2" }, { "b" : "7FADDF957000", "path" : "/lib64/libgssapi_krb5.so.2", "elfType" : 3, "build
      Id" : "E203354E7F907ACC8C3028FE465541B666DCFBA0" }, { "b" : "7FADDF672000", "path" : "/lib64/libkrb5.so.3", "elfType" : 3, "buildId" : "D769C8FFAF8772FDA55031ABF2E167DF2207E378" }, { "b" : "
      7FADDF46F000", "path" : "/usr/lib64/libcom_err.so.2", "elfType" : 3, "buildId" : "5C01209C5AE1B1714F19B07EB58F2A1274B69DC8" }, { "b" : "7FADDF23D000", "path" : "/lib64/libk5crypto.so.3", "el
      fType" : 3, "buildId" : "6C2243D37143F7FD1E16ED1F6CE4D7F16C2D7EF1" }, { "b" : "7FADDF027000", "path" : "/lib64/libz.so.1", "elfType" : 3, "buildId" : "89C6AF118B6B4FB6A73AE1813E2C8BDD722956D
      1" }, { "b" : "7FADDEE18000", "path" : "/lib64/libkrb5support.so.0", "elfType" : 3, "buildId" : "744272FEAAABCE629AB9E11FAA4A96AEBE8BC2B4" }, { "b" : "7FADDEC15000", "path" : "/lib64/libkeyu
      tils.so.1", "elfType" : 3, "buildId" : "37A58210FA50C91E09387765408A92909468D25B" }, { "b" : "7FADDE9FB000", "path" : "/lib64/libresolv.so.2", "elfType" : 3, "buildId" : "47EC2C63132D25E4FE8
      3F77023DA1A66457A88F1" }, { "b" : "7FADDE7DA000", "path" : "/usr/lib64/libselinux.so.1", "elfType" : 3, "buildId" : "F5054DC94443326819FBF3065CFDF5E4726F57EE" } ] }}
       mongod(_ZN5mongo15printStackTraceERSo+0x29) [0xf74fc9]
       mongod(+0xB74642) [0xf74642]
       mongod(+0xB749F6) [0xf749f6]
       libc.so.6(+0x35670) [0x7faddfbd8670]
       libc.so.6(gsignal+0x37) [0x7faddfbd85f7]
       libc.so.6(abort+0x148) [0x7faddfbd9ce8]
       mongod(_ZN5mongo12SecureRandom6createEv+0x1B9) [0xdacd29]
       mongod(_ZN5mongo31SaslSCRAMSHA1ServerConversation10_firstStepERSt6vectorISsSaISsEEPSs+0x16F2) [0x8ed8a2]
       mongod(_ZN5mongo31SaslSCRAMSHA1ServerConversation4stepERKNS_10StringDataEPSs+0x2F1) [0x8ee401]
      

      It looks like the server is crashing at about 5k connections.

      1) Here is my ulimit -a 
      core file size          (blocks, -c) unlimited
      data seg size           (kbytes, -d) unlimited
      scheduling priority             (-e) 0
      file size               (blocks, -f) unlimited
      pending signals                 (-i) 491366
      max locked memory       (kbytes, -l) 64
      max memory size         (kbytes, -m) unlimited
      open files                      (-n) 65536
      pipe size            (512 bytes, -p) 8
      POSIX message queues     (bytes, -q) 819200
      real-time priority              (-r) 0
      stack size              (kbytes, -s) 8192
      cpu time               (seconds, -t) unlimited
      max user processes              (-u) 491366
      virtual memory          (kbytes, -v) unlimited
      file locks                      (-x) unlimited
      
      2) cat /etc/security/limits.conf
      *       soft    nofile  65536
      *       hard    nofile  65536
      *       soft    core unlimited
      
      3) cat /etc/security/limits.d/90-nproc.conf
      *          soft    nproc     65536
      root       soft    nproc     unlimited
      

      The file descriptor limit should be around 65k, so am I missing something here?

            Assignee:
            kelsey.schubert@mongodb.com Kelsey Schubert
            Reporter:
            dharshanr@scalegrid.net Dharshan Rangegowda
            Votes:
            0 Vote for this issue
            Watchers:
            6 Start watching this issue

              Created:
              Updated:
              Resolved: