Regarding Filebeat monitoring:
What is the difference between libbeat.output and libbeat.pipeline?
Is a non-zero libbeat.output.events.failed (33147 in the event below, equal to libbeat.output.events.toomany) a cause for concern? Are we losing data?
We are running Filebeat 7.4.1 in production and shipping its monitoring metrics with the following configuration:
filebeat.autodiscover:
providers:
- type: kubernetes
...
processors:
- add_cloud_metadata: ~
- add_docker_metadata: ~
.....
monitoring:
enabled: true
Filebeat reports very detailed metrics about its output; one of the generated monitoring events is shown below.
"beats_stats": {
"metrics": {
"registrar": {
"writes": {
"success": 1159964,
"total": 1159964,
"fail": 0
},
"states": {
"cleanup": 175,
"current": 92,
"update": 13382777
}
},
"filebeat": {
"events": {
"added": 13382781,
"done": 13382777,
"active": 4
},
"harvester": {
"closed": 1282,
"running": 7,
"open_files": 7,
"skipped": 0,
"started": 1289
},
"input": {
"netflow": {
"packets": {
"received": 0,
"dropped": 0
},
"flows": 0
},
"log": {
"files": {
"renamed": 0,
"truncated": 0
}
}
}
},
"libbeat": {
"pipeline": {
"clients": 37,
"events": {
"retry": 79623,
"active": 4,
"total": 13382781,
"filtered": 2863,
"published": 13379918,
"failed": 0,
"dropped": 0
},
"queue": {
"acked": 13379914
}
},
"config": {
"reloads": 0,
"module": {
"running": 0,
"starts": 0,
"stops": 0
}
},
"output": {
"events": {
"active": 21,
"toomany": 33147,
"batches": 1159990,
"total": 13413082,
"acked": 13379914,
"failed": 33147,
"dropped": 0,
"duplicates": 0
},
"write": {
"bytes": 39927190886,
"errors": 0
},
"read": {
"errors": 0,
"bytes": 3115564222
},
"type": "elasticsearch"
}
},
"system": {
"load": {
"1": 0.1,
"5": 0.11,
"15": 0.16,
"norm": {
"1": 0.0063,
"5": 0.0069,
"15": 0.01
}
},
"cpu": {
"cores": 16
}
},
"beat": {
"info": {
"uptime": {
"ms": 2406820129
},
"ephemeral_id": "dbc0e27c-9743-4b4b-9b3c-6a38478e198a"
},
"memstats": {
"gc_next": 50187360,
"rss": 170217472,
"memory_total": 840912263792,
"memory_alloc": 25784432
},
"cpu": {
"user": {
"time": {
"ms": 10803749
},
"ticks": 10803740
},
"system": {
"time": {
"ms": 9171426
},
"ticks": 9171420
},
"total": {
"time": {
"ms": 19975175
},
"value": 19975160,
"ticks": 19975160
}
},
"runtime": {
"goroutines": 299
},
"handles": {
"open": 21,
"limit": {
"soft": 1048576,
"hard": 1048576
}
}
}
}