Yes, it's a master node.
{
"cluster_name" : "BPOConnectElasticSearch",
"status" : "red",
"timed_out" : false,
"number_of_nodes" : 9,
"number_of_data_nodes" : 6,
"active_primary_shards" : 18232,
"active_shards" : 21453,
"relocating_shards" : 0,
"initializing_shards" : 16, --> It got struck
"unassigned_shards" : 15095,
"delayed_unassigned_shards" : 0,
"number_of_pending_tasks" : 4360,
"number_of_in_flight_fetch" : 0,
"task_max_waiting_in_queue_millis" : 4515942,
"active_shards_percent_as_number" : 58.672464719396125
}
Version of ES:-
"name" : "BPOConnectManagementNode",
"cluster_name" : "BPOConnectElasticSearch",
"version" : {
"number" : "2.3.4",
"build_hash" : "e455fd0c13dceca8dbbdbb1665d068ae55dabe3f",
"build_timestamp" : "2016-06-30T11:24:31Z",
"build_snapshot" : false,
"lucene_version" : "5.5.0"
},
"tagline" : "You Know, for Search"
as 'client' nodes were renamed to coordinating nodes quite a while ago --> NO
RAM & heap size (output of -XGET '_cluster/stats?human&pretty'):
{
"timestamp" : 1596266903468,
"cluster_name" : "BPOConnectElasticSearch",
"status" : "red",
"indices" : {
"count" : 3068,
"shards" : {
"total" : 21653,
"primaries" : 18232,
"replication" : 0.18763712154453707,
"index" : {
"shards" : {
"min" : 1,
"max" : 12,
"avg" : 7.0576923076923075
},
"primaries" : {
"min" : 1,
"max" : 6,
"avg" : 5.942633637548892
},
"replication" : {
"min" : 0.0,
"max" : 1.0,
"avg" : 0.1864189482833549
}
}
},
"docs" : {
"count" : 62036871,
"deleted" : 14
},
"store" : {
"size" : "26gb",
"size_in_bytes" : 27935301698,
"throttle_time" : "0s",
"throttle_time_in_millis" : 0
},
"fielddata" : {
"memory_size" : "0b",
"memory_size_in_bytes" : 0,
"evictions" : 0
},
"query_cache" : {
"memory_size" : "0b",
"memory_size_in_bytes" : 0,
"total_count" : 220641,
"hit_count" : 0,
"miss_count" : 220641,
"cache_size" : 0,
"cache_count" : 0,
"evictions" : 0
},
"completion" : {
"size" : "0b",
"size_in_bytes" : 0
},
"segments" : {
"count" : 98415,
"memory" : "841.9mb",
"memory_in_bytes" : 882895054,
"terms_memory" : "737.3mb",
"terms_memory_in_bytes" : 773116690,
"stored_fields_memory" : "37.9mb",
"stored_fields_memory_in_bytes" : 39759160,
"term_vectors_memory" : "0b",
"term_vectors_memory_in_bytes" : 0,
"norms_memory" : "15.2mb",
"norms_memory_in_bytes" : 16017472,
"doc_values_memory" : "51.5mb",
"doc_values_memory_in_bytes" : 54001732,
"index_writer_memory" : "0b",
"index_writer_memory_in_bytes" : 0,
"index_writer_max_memory" : "12.8gb",
"index_writer_max_memory_in_bytes" : 13768130560,
"version_map_memory" : "0b",
"version_map_memory_in_bytes" : 0,
"fixed_bit_set" : "0b",
"fixed_bit_set_memory_in_bytes" : 0
},
"percolate" : {
"total" : 0,
"time" : "0s",
"time_in_millis" : 0,
"current" : 0,
"memory_size_in_bytes" : -1,
"memory_size" : "-1b",
"queries" : 0
}
},
"nodes" : {
"count" : {
"total" : 7,
"master_only" : 1,
"data_only" : 1,
"master_data" : 5,
"client" : 0
},
"versions" : [ "2.3.4" ],
"os" : {
"available_processors" : 56,
"allocated_processors" : 56,
"mem" : {
"total" : "125.4gb",
"total_in_bytes" : 134660542464
},
"names" : [ {
"name" : "Linux",
"count" : 7
} ]
},
"process" : {
"cpu" : {
"percent" : 23
},
"open_file_descriptors" : {
"min" : 400,
"max" : 72903,
"avg" : 28032
}
},
"jvm" : {
"max_uptime" : "2h",
"max_uptime_in_millis" : 7531566,
"versions" : [ {
"version" : "1.8.0_121",
"vm_name" : "OpenJDK 64-Bit Server VM",
"vm_version" : "25.121-b13",
"vm_vendor" : "Oracle Corporation",
"count" : 4
}, {
"version" : "1.8.0_151",
"vm_name" : "OpenJDK 64-Bit Server VM",
"vm_version" : "25.151-b12",
"vm_vendor" : "Oracle Corporation",
"count" : 3
} ],
"mem" : {
"heap_used" : "44.3gb",
"heap_used_in_bytes" : 47587332584,
"heap_max" : "149.5gb",
"heap_max_in_bytes" : 160573161472
},
"threads" : 621
},
"fs" : {
"total" : "1023.6gb",
"total_in_bytes" : 1099166326784,
"free" : "958.4gb",
"free_in_bytes" : 1029079048192,
"available" : "934.4gb",
"available_in_bytes" : 1003326205952,
"spins" : "true"
},
"plugins" :
The master is always stable. Only the client node is dropping out of the cluster. No, it's not in the cloud; it's a normal virtual machine hosted in our data center.
Client Node Log
[INFO ][cluster.service ] [BPOConnectClientNode01] detected_master {BPOConnectDataNode05}{DwFeVQAXT1e7OvAWzJl2xg}{10.46.XX.XX}{10.46.xx.xx:9300}{master=true}, added {{BPOConnectDataNode02}{lWiurDCdQBeBlKEaqOKB1Q}{10.46.xx.xx}{10.46.xx.xx:9300}{master=true},{BPOConnectDataNode01}{6L30R7wNSk-cF6IonxFQXw}{10.46.xx.xx}{10.46.xx.xx:9300}{master=true},{BPOConnectClientNode02}{WoJeRKDNQYCfJzA3Ht22RA}{10.46.xx.xx}{10.46.xx.xx:9300}{data=false, master=false},{BPOConnectDataNode05}{DwFeVQAXT1e7OvAWzJl2xg}{10.46.xx.xx}{10.46.xx.xx:9300}{master=true},{BPOConnectClientNode01}{QWTeWqHtS_ChB-qTI0huUQ}{10.46.xx.xx}{10.46.xx.xx:9300}{data=false, master=false},{BPOConnectDataNode06}{FKyK7eILRfOqd_0-YT0l6w}{10.46.xx.xx}{10.46.xx.xx:9300}{master=true},{BPOConnectDataNode03}{E-pvqVh7QXms_8A9EmlJjg}{10.46.xx.xx}{10.46.xx.xx:9300}{master=true},{BPOConnectManagementNode}{pqGpyZVQQLaTHBlp_11r_Q}{10.46.xx.xx}{10.46.xx.xx:9300}{data=false, master=true},{BPOConnectClientNode02}{7LiimhjoR7GIwtsB2oF9fg}{10.46.xx.xx}{10.46.xx.xx:9300}{data=false, master=false},{BPOConnectDataNode04}{NZ1m1vLAQMCZnQ_1MYxYNQ}{10.46.xx.xx}{10.46.xx.xx:9300}{master=false},}, reason: zen-disco-receive(from master [{BPOConnectDataNode05}{DwFeVQAXT1e7OvAWzJl2xg}{10.46.xx.xx}{10.46.xx.xx:9300}{master=true}])
[INFO ][cluster.service ] [BPOConnectClientNode01] removed {{BPOConnectClientNode01}{QWTeWqHtS_ChB-qTI0huUQ}{10.46.xx.xx}{10.46.xx.xx:9300}{data=false, master=false},}, reason: zen-disco-receive(from master [{BPOConnectDataNode05}{DwFeVQAXT1e7OvAWzJl2xg}{10.46.xx.xx}{10.46.xx.xx:9300}{master=true}])
[INFO ][cluster.service ] [BPOConnectClientNode01] removed {{BPOConnectClientNode02}{7LiimhjoR7GIwtsB2oF9fg}{10.46.xx.xx}{10.46.xx.xx:9300}{data=false, master=false},}, reason: zen-disco-receive(from master [{BPOConnectDataNode05}{DwFeVQAXT1e7OvAWzJl2xg}{10.46.xx.xx}{10.46.xx.xx:9300}{master=true}])
Note: We have 6 data nodes with 35000 shards, 1 master node, and 5 master-eligible nodes.
After restarting the cluster, "initializing_shards" got stuck and it's not doing anything.
Please help!