Thanks for the feedback that's really great. I can't say for certain what the cluster was being used for at that moment unfortunately, as we have multiple users with access that could be querying for data. We do get a fairly regular stream of incoming data from 4 domain controllers (Windows winlogbeat), 4 Mail Servers (Exchange logs via winlogbeat and filebeat) and a SYSLOG source. I wonder if the environment is not properly specified to handle the load of additional queries on top of that, and I could make some changes?
The 3 ES data/master nodes were configured with 2 vCPU and 4GB RAM, with 3GB assigned for ES heap. I've just upped the spec on all 3 nodes to 4 vCPU and 6GB RAM, with 4GB assigned for ES heap. Would I be right in saying that the ES JVM heap size influences the number of shards that are supportable, so a low heap with high shard count will perform poorly or maybe even grind down to a halt?
With regard to swap, this was enabled by default on my VMware VM Ubuntu template. I've disabled this now and restarted all the VMs to bring them back to in-memory only.
Thanks again, really appreciate it.
P.S. For reference, if the cluster stats output with shard count helps influence sizing discussions:
Summary
{
"_nodes" : {
"total" : 5,
"successful" : 5,
"failed" : 0
},
"cluster_name" : "es-prdcluster",
"cluster_uuid" : "Gtx-g6EBS6WSSqkCgpxIKw",
"timestamp" : 1583337133416,
"status" : "yellow",
"indices" : {
"count" : 86,
"shards" : {
"total" : 449,
"primaries" : 248,
"replication" : 0.8104838709677419,
"index" : {
"shards" : {
"min" : 1,
"max" : 6,
"avg" : 5.22093023255814
},
"primaries" : {
"min" : 1,
"max" : 3,
"avg" : 2.883720930232558
},
"replication" : {
"min" : 0.0,
"max" : 1.0,
"avg" : 0.8023255813953488
}
}
},
"docs" : {
"count" : 237410357,
"deleted" : 3165647
},
"store" : {
"size" : "475.4gb",
"size_in_bytes" : 510474672954
},
"fielddata" : {
"memory_size" : "0b",
"memory_size_in_bytes" : 0,
"evictions" : 0
},
"query_cache" : {
"memory_size" : "0b",
"memory_size_in_bytes" : 0,
"total_count" : 0,
"hit_count" : 0,
"miss_count" : 0,
"cache_size" : 0,
"cache_count" : 0,
"evictions" : 0
},
"completion" : {
"size" : "0b",
"size_in_bytes" : 0
},
"segments" : {
"count" : 6729,
"memory" : "499.4mb",
"memory_in_bytes" : 523679947,
"terms_memory" : "225.8mb",
"terms_memory_in_bytes" : 236805394,
"stored_fields_memory" : "229.4mb",
"stored_fields_memory_in_bytes" : 240621760,
"term_vectors_memory" : "0b",
"term_vectors_memory_in_bytes" : 0,
"norms_memory" : "3.9kb",
"norms_memory_in_bytes" : 4032,
"points_memory" : "22.8mb",
"points_memory_in_bytes" : 23988045,
"doc_values_memory" : "21.2mb",
"doc_values_memory_in_bytes" : 22260716,
"index_writer_memory" : "92.9mb",
"index_writer_memory_in_bytes" : 97469900,
"version_map_memory" : "2.6mb",
"version_map_memory_in_bytes" : 2782834,
"fixed_bit_set" : "2.5mb",
"fixed_bit_set_memory_in_bytes" : 2676928,
"max_unsafe_auto_id_timestamp" : 1583336925190,
"file_sizes" : { }
}
},
"nodes" : {
"count" : {
"total" : 5,
"coordinating_only" : 1,
"data" : 3,
"ingest" : 2,
"master" : 3,
"ml" : 0,
"voting_only" : 0
},
"versions" : [
"7.5.2"
],
"os" : {
"available_processors" : 16,
"allocated_processors" : 16,
"names" : [
{
"name" : "Linux",
"count" : 5
}
],
"pretty_names" : [
{
"pretty_name" : "Ubuntu 18.04.2 LTS",
"count" : 5
}
],
"mem" : {
"total" : "27.1gb",
"total_in_bytes" : 29138182144,
"free" : "702.6mb",
"free_in_bytes" : 736747520,
"used" : "26.4gb",
"used_in_bytes" : 28401434624,
"free_percent" : 3,
"used_percent" : 97
}
},
"process" : {
"cpu" : {
"percent" : 9
},
"open_file_descriptors" : {
"min" : 309,
"max" : 42490,
"avg" : 18780
}
},
"jvm" : {
"max_uptime" : "5.5h",
"max_uptime_in_millis" : 19991310,
"versions" : [
{
"version" : "13.0.1",
"vm_name" : "OpenJDK 64-Bit Server VM",
"vm_version" : "13.0.1+9",
"vm_vendor" : "AdoptOpenJDK",
"bundled_jdk" : true,
"using_bundled_jdk" : true,
"count" : 5
}
],
"mem" : {
"heap_used" : "3.2gb",
"heap_used_in_bytes" : 3486837528,
"heap_max" : "16.8gb",
"heap_max_in_bytes" : 18114150400
},
"threads" : 292
},
"fs" : {
"total" : "976.8gb",
"total_in_bytes" : 1048904966144,
"free" : "422.3gb",
"free_in_bytes" : 453460488192,
"available" : "375.3gb",
"available_in_bytes" : 403061383168
},
"plugins" : ,
"network_types" : {
"transport_types" : {
"security4" : 5
},
"http_types" : {
"security4" : 5
}
},
"discovery_types" : {
"zen" : 5
},
"packaging_types" : [
{
"flavor" : "default",
"type" : "deb",
"count" : 5
}
]
}
}