Metricbeat stops on agents

Hi,

I have installed Metricbeat 7.2 and Filebeat on different Windows and Linux servers. I see the Metricbeat process stop on the Windows servers without any error in the log. Can you please guide me on how to trace what is causing it to stop? The last log lines before it stopped are below.

|2019-07-04T14:21:55.520-0700|INFO|[monitoring]|log/log.go:145|Non-zero metrics in the last 30s|{"monitoring": {"metrics": {"beat":{"cpu":{"system":{"ticks":781921,"time":{"ms":140}},"total":{"ticks":1044874,"time":{"ms":234},"value":1044874},"user":{"ticks":262953,"time":{"ms":94}}},"handles":{"open":196},"info":{"ephemeral_id":"53174fb2-b5a9-495a-8530-43b45d78d65d","uptime":{"ms":166230875}},"memstats":{"gc_next":11124912,"memory_alloc":7634856,"memory_total":27351052864},"runtime":{"goroutines":39}},"libbeat":{"config":{"module":{"running":0}},"output":{"events":{"acked":47,"batches":6,"total":47},"read":{"bytes":2328},"write":{"bytes":69191}},"pipeline":{"clients":3,"events":{"active":0,"published":47,"total":47},"queue":{"acked":47}}},"metricbeat":{"system":{"cpu":{"events":3,"success":3},"filesystem":{"events":1,"success":1},"fsstat":{"events":1,"success":1},"memory":{"events":3,"success":3},"network":{"events":9,"success":9},"process":{"events":24,"success":24},"process_summary":{"events":3,"success":3},"socket_summary":{"events":3,"success":3}}}}}}|
|---|---|---|---|---|---|
|2019-07-04T14:22:25.518-0700|INFO|[monitoring]|log/log.go:145|Non-zero metrics in the last 30s|{"monitoring": {"metrics": {"beat":{"cpu":{"system":{"ticks":782046,"time":{"ms":125}},"total":{"ticks":1045014,"time":{"ms":140},"value":1045014},"user":{"ticks":262968,"time":{"ms":15}}},"handles":{"open":196},"info":{"ephemeral_id":"53174fb2-b5a9-495a-8530-43b45d78d65d","uptime":{"ms":166260873}},"memstats":{"gc_next":10641072,"memory_alloc":7313064,"memory_total":27355756912},"runtime":{"goroutines":39}},"libbeat":{"config":{"module":{"running":0}},"output":{"events":{"acked":44,"batches":6,"total":44},"read":{"bytes":2305},"write":{"bytes":64520}},"pipeline":{"clients":3,"events":{"active":0,"published":44,"total":44},"queue":{"acked":44}}},"metricbeat":{"system":{"cpu":{"events":3,"success":3},"memory":{"events":3,"success":3},"network":{"events":9,"success":9},"process":{"events":23,"success":23},"process_summary":{"events":3,"success":3},"socket_summary":{"events":3,"success":3}}}}}}|
|2019-07-04T14:22:55.520-0700|INFO|[monitoring]|log/log.go:145|Non-zero metrics in the last 30s|{"monitoring": {"metrics": {"beat":{"cpu":{"system":{"ticks":782156,"time":{"ms":110}},"total":{"ticks":1045187,"time":{"ms":173},"value":1045187},"user":{"ticks":263031,"time":{"ms":63}}},"handles":{"open":198},"info":{"ephemeral_id":"53174fb2-b5a9-495a-8530-43b45d78d65d","uptime":{"ms":166290874}},"memstats":{"gc_next":11027824,"memory_alloc":7794168,"memory_total":27360931888},"runtime":{"goroutines":39}},"libbeat":{"config":{"module":{"running":0}},"output":{"events":{"acked":45,"batches":6,"total":45},"read":{"bytes":2320},"write":{"bytes":64989}},"pipeline":{"clients":3,"events":{"active":0,"published":45,"total":45},"queue":{"acked":45}}},"metricbeat":{"system":{"cpu":{"events":3,"success":3},"filesystem":{"events":1,"success":1},"fsstat":{"events":1,"success":1},"memory":{"events":3,"success":3},"network":{"events":9,"success":9},"process":{"events":22,"success":22},"process_summary":{"events":3,"success":3},"socket_summary":{"events":3,"success":3}}}}}}|
|2019-07-04T14:23:25.521-0700|INFO|[monitoring]|log/log.go:145|Non-zero metrics in the last 30s|{"monitoring": {"metrics": {"beat":{"cpu":{"system":{"ticks":782312,"time":{"ms":156}},"total":{"ticks":1045374,"time":{"ms":187},"value":1045374},"user":{"ticks":263062,"time":{"ms":31}}},"handles":{"open":196},"info":{"ephemeral_id":"53174fb2-b5a9-495a-8530-43b45d78d65d","uptime":{"ms":166320874}},"memstats":{"gc_next":10339728,"memory_alloc":7422648,"memory_total":27365598400,"rss":12288},"runtime":{"goroutines":39}},"libbeat":{"config":{"module":{"running":0}},"output":{"events":{"acked":43,"batches":6,"total":43},"read":{"bytes":2309},"write":{"bytes":63212}},"pipeline":{"clients":3,"events":{"active":0,"published":43,"total":43},"queue":{"acked":43}}},"metricbeat":{"system":{"cpu":{"events":3,"success":3},"memory":{"events":3,"success":3},"network":{"events":9,"success":9},"process":{"events":22,"success":22},"process_summary":{"events":3,"success":3},"socket_summary":{"events":3,"success":3}}}}}}|
|2019-07-04T14:23:55.521-0700|INFO|[monitoring]|log/log.go:145|Non-zero metrics in the last 30s|{"monitoring": {"metrics": {"beat":{"cpu":{"system":{"ticks":782468,"time":{"ms":156}},"total":{"ticks":1045577,"time":{"ms":203},"value":1045577},"user":{"ticks":263109,"time":{"ms":47}}},"handles":{"open":198},"info":{"ephemeral_id":"53174fb2-b5a9-495a-8530-43b45d78d65d","uptime":{"ms":166350873}},"memstats":{"gc_next":10675120,"memory_alloc":8442920,"memory_total":27370799024,"rss":4096},"runtime":{"goroutines":39}},"libbeat":{"config":{"module":{"running":0}},"output":{"events":{"acked":47,"batches":6,"total":47},"read":{"bytes":2337},"write":{"bytes":67994}},"pipeline":{"clients":3,"events":{"active":0,"published":47,"total":47},"queue":{"acked":47}}},"metricbeat":{"system":{"cpu":{"events":3,"success":3},"filesystem":{"events":1,"success":1},"fsstat":{"events":1,"success":1},"memory":{"events":3,"success":3},"network":{"events":9,"success":9},"process":{"events":24,"success":24},"process_summary":{"events":3,"success":3},"socket_summary":{"events":3,"success":3}}}}}}|
|2019-07-04T14:24:25.523-0700|INFO|[monitoring]|log/log.go:145|Non-zero metrics in the last 30s|{"monitoring": {"metrics": {"beat":{"cpu":{"system":{"ticks":782546,"time":{"ms":78}},"total":{"ticks":1045686,"time":{"ms":109},"value":1045686},"user":{"ticks":263140,"time":{"ms":31}}},"handles":{"open":198},"info":{"ephemeral_id":"53174fb2-b5a9-495a-8530-43b45d78d65d","uptime":{"ms":166380873}},"memstats":{"gc_next":10596208,"memory_alloc":8458448,"memory_total":27375520128,"rss":-102400},"runtime":{"goroutines":39}},"libbeat":{"config":{"module":{"running":0}},"output":{"events":{"acked":45,"batches":6,"total":45},"read":{"bytes":2309},"write":{"bytes":67431}},"pipeline":{"clients":3,"events":{"active":0,"published":45,"total":45},"queue":{"acked":45}}},"metricbeat":{"system":{"cpu":{"events":3,"success":3},"memory":{"events":3,"success":3},"network":{"events":9,"success":9},"process":{"events":24,"success":24},"process_summary":{"events":3,"success":3},"socket_summary":{"events":3,"success":3}}}}}}|
    `indent preformatted text by 4 spaces`

Hi @syedsfayaz, thanks for posting your question here. When you say stop, does it mean Metricbeat crashed and you have to restart it? Does this happen to you constantly and you are able to reproduce? What Metricbeat config are you using?

@Kaiyan_Sheng Yes, Metricbeat crashes and I have to restart it manually. I have seen this issue predominantly on Windows. This is the Metricbeat config I am using:

metricbeat.config.modules:
  # Glob pattern for configuration loading
  path: ${path.config}/modules.d/*.yml

  # Set to true to enable config reloading
  reload.enabled: false

  # Period on which files under path should be checked for changes
  #reload.period: 10s

#==================== Elasticsearch template setting ==========================

setup.template.settings:
  index.number_of_shards: 1
  index.number_of_replicas: 0
  index.codec: best_compression
  _source.enabled: true 

setup.ilm.enabled: auto

# Configure the ILM write alias name.
setup.ilm.rollover_alias: "metricbeat"

# Configure rollover index pattern.
setup.ilm.pattern: "{now/d}-000001"


output.elasticsearch:
  # Array of hosts to connect to.
  hosts: ["example.host.com:9200"]

  # Optional protocol and basic auth credentials.
  #protocol: "https"
  username: "elastic"
  password: "*******"

processors:
  - add_host_metadata: ~
  - add_cloud_metadata: ~

Thanks! It seems a similar Metricbeat crash was reported on GitHub several hours ago: https://github.com/elastic/beats/issues/12826

Thank you.

@Kaiyan_Sheng I see the linked issue has been fixed. Any idea how I can get these changes? I went to the downloads page, but the build there still shows the old date, so I assume the fix has not been released yet.