Hi David, it seems there might be a misconfiguration related to the number of nodes, and I might need some explicit settings so that cluster routing allocates shards only to the hot nodes.
I have 4 'hot' data nodes and 2 'warm' data nodes. Below is the allocation explanation output for one of the replica shards:
"index" : "index-000003",
"shard" : 0,
"primary" : false,
"current_state" : "started",
"current_node" : {
"id" : "J-k9P8KCTjyZ96S7dffvrw",
"name" : "node-5",
"transport_address" : "192.168.1.8:9300",
"attributes" : {
"ml.machine_memory" : "16510197760",
"ml.max_open_jobs" : "20",
"xpack.installed" : "true",
"data" : "warm"
},
"weight_ranking" : 5
},
"can_remain_on_current_node" : "yes",
"can_rebalance_cluster" : "yes",
"can_rebalance_to_other_node" : "no",
"rebalance_explanation" : "cannot rebalance as no target node exists that can both allocate this shard and improve the cluster balance",
"node_allocation_decisions" : [
{
"node_id" : "huFdb7s0SBKjPqN_6xAnyg",
"node_name" : "node-1",
"transport_address" : "192.168.1.2:9300",
"node_attributes" : {
"ml.machine_memory" : "32144646144",
"ml.max_open_jobs" : "20",
"xpack.installed" : "true",
"data" : "hot"
},
"node_decision" : "no",
"weight_ranking" : 1,
"deciders" : [
{
"decider" : "max_retry",
"decision" : "YES",
"explanation" : "shard has no previous failures"
},
{
"decider" : "replica_after_primary_active",
"decision" : "YES",
"explanation" : "primary shard for this replica is already active"
},
{
"decider" : "enable",
"decision" : "YES",
"explanation" : "all allocations are allowed"
},
{
"decider" : "node_version",
"decision" : "YES",
"explanation" : "can allocate replica shard to a node with version [7.3.1] since this is equal-or-newer than the primary version [7.3.1]"
},
{
"decider" : "snapshot_in_progress",
"decision" : "YES",
"explanation" : "the shard is not being snapshotted"
},
{
"decider" : "restore_in_progress",
"decision" : "YES",
"explanation" : "ignored as shard is not being recovered from a snapshot"
},
{
"decider" : "filter",
"decision" : "YES",
"explanation" : "node passes include/exclude/require filters"
},
{
"decider" : "same_shard",
"decision" : "NO",
"explanation" : "the shard cannot be allocated to the same node on which a copy of the shard already exists [[us-application-logs-000021][0], node[huFdb7s0SBKjPqN_6xAnyg], [P], s[STARTED], a[id=k_2YYC6cTnKXkR3MYciw9A]]"
},
{
"decider" : "disk_threshold",
"decision" : "YES",
"explanation" : "enough disk for shard on node, free: [773.9gb], shard size: [3.9gb], free after allocating shard: [769.9gb]"
},
{
"decider" : "throttling",
"decision" : "YES",
"explanation" : "below shard recovery limit of outgoing: [0 < 2] incoming: [0 < 2]"
},
{
"decider" : "shards_limit",
"decision" : "YES",
"explanation" : "total shard limits are disabled: [index: -1, cluster: -1] <= 0"
},
{
"decider" : "awareness",
"decision" : "NO",
"explanation" : "there are too many copies of the shard allocated to nodes with attribute [data], there are [2] total configured shard copies for this shard id and [2] total attribute values, expected the allocated shard count per attribute [2] to be less than or equal to the upper bound of the required number of shards per attribute [1]"
}
]
}