Everything was chugging along, processing about 2k messages/sec, and then
it just hung. Running strace on the process shows the trace below, which
persists even through restarts of Elasticsearch. It seems that the issue
occurs right after a clone system call. Any ideas?
open("/usr/share/java/elasticsearch/lib/sigar/",
O_RDONLY|O_NONBLOCK|O_DIRECTORY|O_CLOEXEC) = 3
getdents(3, /* 4 entries */, 32768) = 136
getdents(3, /* 0 entries */, 32768) = 0
close(3) = 0
mmap(NULL, 135168, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_ANONYMOUS|MAP_STACK, -1, 0) = 0x7f4c05f79000
mprotect(0x7f4c05f79000, 4096, PROT_NONE) = 0
clone(child_stack=0x7f4c05f98ff0,
flags=CLONE_VM|CLONE_FS|CLONE_FILES|CLONE_SIGHAND|CLONE_THREAD|CLONE_SYSVSEM|CLONE_SETTLS|CLONE_PARENT_SETTID|CLONE_CHILD_CLEARTID,
parent_tidptr=0x7f4c05f999d0, tls=0x7f4c05f99700,
child_tidptr=0x7f4c05f999d0) = 32755
futex(0x7f4c05f999d0, FUTEX_WAIT, 32755, NULL) = ? ERESTARTSYS (To be
restarted)
futex(0x7f4c05f999d0, FUTEX_WAIT, 32755, NULL) = ? ERESTARTSYS (To be
restarted)
futex(0x7f4c05f999d0, FUTEX_WAIT, 32755, NULL) = ? ERESTARTSYS (To be
restarted)
--- SIGINT (Interrupt) @ 0 (0) ---
futex(0x7f4c06c23440, FUTEX_WAKE_PRIVATE, 1) = 1
rt_sigreturn(0x7f4c06c23440) = 202
futex(0x7f4c05f999d0, FUTEX_WAIT, 32755, NULL) = ? ERESTARTSYS (To be
restarted)
--- SIGINT (Interrupt) @ 0 (0) ---
futex(0x7f4c06c23440, FUTEX_WAKE_PRIVATE, 1) = 1
rt_sigreturn(0x7f4c06c23440) = 202
futex(0x7f4c05f999d0, FUTEX_WAIT, 32755, NULL) = ? ERESTARTSYS (To be
restarted)
--- SIGINT (Interrupt) @ 0 (0) ---
futex(0x7f4c06c23440, FUTEX_WAKE_PRIVATE, 1) = 1
rt_sigreturn(0x7f4c06c23440) = 202
futex(0x7f4c05f999d0, FUTEX_WAIT, 32755, NULL) = ? ERESTARTSYS (To be
restarted)
--- SIGINT (Interrupt) @ 0 (0) ---
futex(0x7f4c06c23440, FUTEX_WAKE_PRIVATE, 1) = 1
rt_sigreturn(0x7f4c06c23440) = 202
futex(0x7f4c05f999d0, FUTEX_WAIT, 32755, NULL) = ? ERESTARTSYS (To be
restarted)
--- SIGINT (Interrupt) @ 0 (0) ---
futex(0x7f4c06c23440, FUTEX_WAKE_PRIVATE, 1) = 1
rt_sigreturn(0x7f4c06c23440) = 202
futex(0x7f4c05f999d0, FUTEX_WAIT, 32755, NULL) = ? ERESTARTSYS (To be
restarted)
--- SIGINT (Interrupt) @ 0 (0) ---
futex(0x7f4c06c23440, FUTEX_WAKE_PRIVATE, 1) = 1
rt_sigreturn(0x7f4c06c23440) = 202
futex(0x7f4c05f999d0, FUTEX_WAIT, 32755, NULL) = ? ERESTARTSYS (To be
restarted)
--- SIGINT (Interrupt) @ 0 (0) ---
futex(0x7f4c06c23440, FUTEX_WAKE_PRIVATE, 1) = 1
rt_sigreturn(0x7f4c06c23440) = 202
futex(0x7f4c05f999d0, FUTEX_WAIT, 32755, NULL