Hi all,
Our Elasticsearch application failed due to JVM errors. I tried to fix this by setting esJavaOpts: "-Xmx8g -Xms8g" in the YAML file, but unfortunately this did not help. In general, the application is based on 3 servers with 8 CPUs and 32 GB of memory, plus a large NFS storage.
Please assist.
{"type": "server", "timestamp": "2021-07-19T18:48:05,588Z", "level": "INFO", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23103] overhead, spent [525ms] collecting in the last [1s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:48:45,195Z", "level": "INFO", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23141] overhead, spent [287ms] collecting in the last [1s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:49:18,185Z", "level": "INFO", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23173] overhead, spent [271ms] collecting in the last [1s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:49:56,697Z", "level": "INFO", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23211] overhead, spent [360ms] collecting in the last [1s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:50:26,002Z", "level": "INFO", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23240] overhead, spent [374ms] collecting in the last [1.1s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:50:53,397Z", "level": "WARN", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23267] overhead, spent [563ms] collecting in the last [1s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:53:48,590Z", "level": "INFO", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23439] overhead, spent [292ms] collecting in the last [1s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:54:26,595Z", "level": "INFO", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23476] overhead, spent [315ms] collecting in the last [1s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:55:03,390Z", "level": "INFO", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23512] overhead, spent [258ms] collecting in the last [1s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:56:08,988Z", "level": "INFO", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23577] overhead, spent [467ms] collecting in the last [1.2s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:58:05,237Z", "level": "INFO", "component": "o.e.c.s.ClusterApplierService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "added {{elasticsearch-master-2}{fNZ2A7YhSK6Xj1BdrhYzbg}{S2SwXydVSOmI_G3ubnQFhQ}{10.42.0.166}{10.42.0.166:9300}{cdfhilmrstw}{ml.machine_memory=25769803776, ml.max_open_jobs=20, xpack.installed=true, ml.max_jvm_size=2147483648, transform.node=true}}, term: 160, version: 174966, reason: ApplyCommitRequest{term=160, version=174966, sourceNode={elasticsearch-master-1}{jOBr_EBpTKCP-O9qPBAQCg}{TY8G2-_4QTCZ02d2ne7tug}{10.42.1.243}{10.42.1.243:9300}{cdfhilmrstw}{ml.machine_memory=10737418240, ml.max_open_jobs=20, xpack.installed=true, ml.max_jvm_size=8589934592, transform.node=true}}", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:58:40,140Z", "level": "WARN", "component": "o.e.t.TransportService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "Received response for a request that has timed out, sent [18.6s/18694ms] ago, timed out [8.8s/8815ms] ago, action [internal:coordination/fault_detection/leader_check], node [{elasticsearch-master-1}{jOBr_EBpTKCP-O9qPBAQCg}{TY8G2-_4QTCZ02d2ne7tug}{10.42.1.243}{10.42.1.243:9300}{cdfhilmrstw}{ml.machine_memory=10737418240, ml.max_open_jobs=20, xpack.installed=true, ml.max_jvm_size=8589934592, transform.node=true}], id [5306751]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:59:01,966Z", "level": "INFO", "component": "o.e.m.j.JvmGcMonitorService", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "[gc][23749] overhead, spent [262ms] collecting in the last [1s]", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" }
{"type": "server", "timestamp": "2021-07-19T18:59:26,036Z", "level": "INFO", "component": "o.e.c.c.Coordinator", "cluster.name": "elasticsearch", "node.name": "elasticsearch-master-0", "message": "master node [{elasticsearch-master-1}{jOBr_EBpTKCP-O9qPBAQCg}{TY8G2-_4QTCZ02d2ne7tug}{10.42.1.243}{10.42.1.243:9300}{cdfhilmrstw}{ml.machine_memory=10737418240, ml.max_open_jobs=20, xpack.installed=true, ml.max_jvm_size=8589934592, transform.node=true}] failed, restarting discovery", "cluster.uuid": "JU99REOhRxa8BEoy2Ib1Gg", "node.id": "cuF0wFv2T1a_g64EBFvgPw" ,
"stacktrace": ["org.elasticsearch.ElasticsearchException: node [{elasticsearch-master-1}{jOBr_EBpTKCP-O9qPBAQCg}{TY8G2-_4QTCZ02d2ne7tug}{10.42.1.243}{10.42.1.243:9300}{cdfhilmrstw}{ml.machine_memory=10737418240, ml.max_open_jobs=20, xpack.installed=true, ml.max_jvm_size=8589934592, transform.node=true}] failed [3] consecutive checks",
"at org.elasticsearch.cluster.coordination.LeaderChecker$CheckScheduler$1.handleException(LeaderChecker.java:275) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.TransportService$ContextRestoreResponseHandler.handleException(TransportService.java:1290) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.TransportService$ContextRestoreResponseHandler.handleException(TransportService.java:1290) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.InboundHandler.lambda$handleException$3(InboundHandler.java:317) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.common.util.concurrent.EsExecutors$DirectExecutorService.execute(EsExecutors.java:215) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.InboundHandler.handleException(InboundHandler.java:315) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.InboundHandler.handlerResponseError(InboundHandler.java:307) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.InboundHandler.messageReceived(InboundHandler.java:126) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.InboundHandler.inboundMessage(InboundHandler.java:84) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.TcpTransport.inboundMessage(TcpTransport.java:690) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.InboundPipeline.forwardFragments(InboundPipeline.java:131) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.InboundPipeline.doHandleBytes(InboundPipeline.java:106) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.InboundPipeline.handleBytes(InboundPipeline.java:71) ~[elasticsearch-7.12.1.jar:7.12.1]",
"at org.elasticsearch.transport.netty4.Netty4MessageChannelHandler.channelRead(Netty4MessageChannelHandler.java:63) ~[?:?]",
"at io.netty.channel.AbstractChannelHandlerContext.invokeChannelRead(AbstractChannelHandlerContext.java:379) ~[?:?]",
"at io.netty.channel.AbstractChannelHandlerContext.invokeChannelRead(AbstractChannelHandlerContext.java:365) ~[?:?]",
"at io.netty.channel.AbstractChannelHandlerContext.fireChannelRead(AbstractChannelHandlerContext.java:357) ~[?:?]",
"at io.netty.handler.logging.LoggingHandler.channelRead(LoggingHandler.java:271) ~[?:?]",
"at io.netty.channel.AbstractChannelHandlerContext.invokeChannelRead(AbstractChannelHandlerContext.java:379) ~[?:?]",
"at io.netty.channel.AbstractChannelHandlerContext.invokeChannelRead(AbstractChannelHandlerContext.java:365) ~[?:?]",
"at io.netty.channel.AbstractChannelHandlerContext.fireChannelRead(AbstractChannelHandlerContext.java:357) ~[?:?]",
"at io.netty.channel.DefaultChannelPipeline$HeadContext.channelRead(DefaultChannelPipeline.java:1410) ~[?:?]",
"at io.netty.channel.AbstractChannelHandlerContext.invokeChannelRead(AbstractChannelHandlerContext.java:379) ~[?:?]",
"at io.netty.channel.AbstractChannelHandlerContext.invokeChannelRead(AbstractChannelHandlerContext.java:365) ~[?:?]",
"at io.netty.channel.DefaultChannelPipeline.fireChannelRead(DefaultChannelPipeline.java:919) ~[?:?]",
"at io.netty.channel.nio.AbstractNioByteChannel$NioByteUnsafe.read(AbstractNioByteChannel.java:163) ~[?:?]",
"at io.netty.channel.nio.NioEventLoop.processSelectedKey(NioEventLoop.java:714) ~[?:?]",
"at io.netty.channel.nio.NioEventLoop.processSelectedKeysPlain(NioEventLoop.java:615) ~[?:?]",
"at io.netty.channel.nio.NioEventLoop.processSelectedKeys(NioEventLoop.java:578) ~[?:?]",
"at io.netty.channel.nio.NioEventLoop.run(NioEventLoop.java:493) ~[?:?]",
"at io.netty.util.concurrent.SingleThreadEventExecutor$4.run(SingleThreadEventExecutor.java:989) ~[?:?]",
"at io.netty.util.internal.ThreadExecutorMap$2.run(ThreadExecutorMap.java:74) ~[?:?]",
"at java.lang.Thread.run(Thread.java:831) [?:?]",