My apologies for that tone; my emotions got the best of me.
Since this discussion started, I bounced the node that had all the primary shards so that the primaries would distribute a bit. The primaries are still "clumping", but recovery is faster. This is from our new cluster, which holds roughly a 1/4 sample of the data from our existing cluster.
Given that things have changed, I do not know if the _recovery output will provide you with any useful information, but here it is:
{
"unittest20180325_000000":{"shards":[{
"id":12,
"type":"PEER",
"stage":"INDEX",
"primary":false,
"start_time":"2018-04-10T10:47:01.290Z",
"start_time_in_millis":1523357221290,
"total_time":"1.5m",
"total_time_in_millis":92397,
"source":{
"id":"OpYrgkLLR6W_GZsML08Kzw",
"host":"172.31.1.41",
"transport_address":"172.31.1.41:9300",
"ip":"172.31.1.41",
"name":"spot_172.31.1.41"
},
"target":{
"id":"fB2lIO3AShmS_Mu7_db6kw",
"host":"172.31.1.133",
"transport_address":"172.31.1.133:9300",
"ip":"172.31.1.133",
"name":"spot_172.31.1.133"
},
"index":{
"size":{
"total":"5.1gb",
"total_in_bytes":5553993709,
"reused":"0b",
"reused_in_bytes":0,
"recovered":"1.5gb",
"recovered_in_bytes":1651615562,
"percent":"29.7%"
},
"files":{"total":117,"reused":0,"recovered":110,"percent":"94.0%"},
"total_time":"1.5m",
"total_time_in_millis":92392,
"source_throttle_time":"0s",
"source_throttle_time_in_millis":0,
"target_throttle_time":"0s",
"target_throttle_time_in_millis":0
},
"translog":{
"recovered":0,
"total":0,
"percent":"100.0%",
"total_on_start":0,
"total_time":"0s",
"total_time_in_millis":0
},
"verify_index":{
"check_index_time":"0s",
"check_index_time_in_millis":0,
"total_time":"0s",
"total_time_in_millis":0
}
}]},
"unittest20180401_000000":{"shards":[
{
"id":29,
"type":"PEER",
"stage":"INDEX",
"primary":true,
"start_time":"2018-04-10T10:44:16.083Z",
"start_time_in_millis":1523357056083,
"total_time":"4.2m",
"total_time_in_millis":257607,
"source":{
"id":"tGN6xh4EQe-cMdEm0G3ZCg",
"host":"172.31.1.161",
"transport_address":"172.31.1.161:9300",
"ip":"172.31.1.161",
"name":"spot_172.31.1.161"
},
"target":{
"id":"leqOW1llRq-7s_amdj9rhA",
"host":"172.31.1.235",
"transport_address":"172.31.1.235:9300",
"ip":"172.31.1.235",
"name":"spot_172.31.1.161"
},
"index":{
"size":{
"total":"5.1gb",
"total_in_bytes":5489771388,
"reused":"0b",
"reused_in_bytes":0,
"recovered":"4.9gb",
"recovered_in_bytes":5278959664,
"percent":"96.2%"
},
"files":{"total":129,"reused":0,"recovered":128,"percent":"99.2%"},
"total_time":"4.2m",
"total_time_in_millis":256860,
"source_throttle_time":"0s",
"source_throttle_time_in_millis":0,
"target_throttle_time":"0s",
"target_throttle_time_in_millis":0
},
"translog":{
"recovered":0,
"total":6618,
"percent":"0.0%",
"total_on_start":6565,
"total_time":"0s",
"total_time_in_millis":0
},
"verify_index":{
"check_index_time":"0s",
"check_index_time_in_millis":0,
"total_time":"0s",
"total_time_in_millis":0
}
},
{
"id":4,
"type":"PEER",
"stage":"INDEX",
"primary":true,
"start_time":"2018-04-10T10:35:58.794Z",
"start_time_in_millis":1523356558794,
"total_time":"12.5m",
"total_time_in_millis":754889,
"source":{
"id":"rNtDq87WQhWaHsKlbZRPzw",
"host":"172.31.1.76",
"transport_address":"172.31.1.76:9300",
"ip":"172.31.1.76",
"name":"spot_172.31.1.76"
},
"target":{
"id":"eLdwRD2RR7SmkJWkelrdhw",
"host":"172.31.1.163",
"transport_address":"172.31.1.163:9300",
"ip":"172.31.1.163",
"name":"spot_172.31.1.76"
},
"index":{
"size":{
"total":"5gb",
"total_in_bytes":5469790162,
"reused":"0b",
"reused_in_bytes":0,
"recovered":"5gb",
"recovered_in_bytes":5391906410,
"percent":"98.6%"
},
"files":{"total":124,"reused":0,"recovered":123,"percent":"99.2%"},
"total_time":"12.5m",
"total_time_in_millis":753338,
"source_throttle_time":"213.5ms",
"source_throttle_time_in_millis":213,
"target_throttle_time":"0s",
"target_throttle_time_in_millis":0
},
"translog":{
"recovered":0,
"total":17026,
"percent":"0.0%",
"total_on_start":16983,
"total_time":"0s",
"total_time_in_millis":0
},
"verify_index":{
"check_index_time":"0s",
"check_index_time_in_millis":0,
"total_time":"0s",
"total_time_in_millis":0
}
}
]}
}