Alerts

task_high_memory_usage_1g (9 active)
# Fires when the RSS memory of a Swarm task, summed per task name and node id,
# stays above 1e+09 bytes for one minute. The =~".+" matcher keeps only series
# whose Swarm task-name label is non-empty.
alert: task_high_memory_usage_1g
expr: sum
  by(container_label_com_docker_swarm_task_name, container_label_com_docker_swarm_node_id)
  (container_memory_rss{container_label_com_docker_swarm_task_name=~".+"})
  > 1e+09
for: 1m
# NOTE(review): the node_* rules in this listing attach a severity label; this
# rule has none. Confirm that is intentional before relying on severity routing.
annotations:
  # Double-quoted so the literal single quotes around the node id remain part of
  # the scalar; in a single-quoted scalar they would terminate the string early.
  description: "{{ $labels.container_label_com_docker_swarm_task_name }} on '{{
    $labels.container_label_com_docker_swarm_node_id }}' memory usage is {{ humanize
    $value}}."
  summary: Memory alert for Swarm task '{{ $labels.container_label_com_docker_swarm_task_name
    }}' on '{{ $labels.container_label_com_docker_swarm_node_id }}'
Labels State Active Since Value
alertname="task_high_memory_usage_1g" container_label_com_docker_swarm_node_id="zn6molvsehr5g0mfoutenztux" container_label_com_docker_swarm_task_name="alpina-stage_mariadb.1.w5pp8rpy8jed7pri3wcmhhlga" firing 2024-11-26 01:46:03.069511962 +0000 UTC 3.795226624e+09
alertname="task_high_memory_usage_1g" container_label_com_docker_swarm_node_id="zn6molvsehr5g0mfoutenztux" container_label_com_docker_swarm_task_name="alpina-stress_db.1.sxyiswnwwqconle56doryctpd" firing 2024-11-26 01:46:03.069511962 +0000 UTC 2.594902016e+09
alertname="task_high_memory_usage_1g" container_label_com_docker_swarm_node_id="zn6molvsehr5g0mfoutenztux" container_label_com_docker_swarm_task_name="alpina-dev4_db.1.z30jtew2yp5bg8bgwqigt1t7q" firing 2024-11-26 01:45:48.069511962 +0000 UTC 2.778005504e+09
alertname="task_high_memory_usage_1g" container_label_com_docker_swarm_node_id="zn6molvsehr5g0mfoutenztux" container_label_com_docker_swarm_task_name="alpina-dev2_db.1.xxjx247yu3kro8smbxqqxxkl4" firing 2024-11-26 01:45:48.069511962 +0000 UTC 3.084939264e+09
alertname="task_high_memory_usage_1g" container_label_com_docker_swarm_node_id="zn6molvsehr5g0mfoutenztux" container_label_com_docker_swarm_task_name="alpina-we-dev1_db.1.d2m4m9pwbzfx280zm5ukx8k2x" firing 2024-11-26 01:46:03.069511962 +0000 UTC 2.510020608e+09
alertname="task_high_memory_usage_1g" container_label_com_docker_swarm_node_id="zn6molvsehr5g0mfoutenztux" container_label_com_docker_swarm_task_name="alpina-dev1_db.1.6ljc794c0c9901bj7glk3blqp" firing 2024-11-26 01:46:03.069511962 +0000 UTC 2.88905216e+09
alertname="task_high_memory_usage_1g" container_label_com_docker_swarm_node_id="zn6molvsehr5g0mfoutenztux" container_label_com_docker_swarm_task_name="alpina-dev3_db.1.l4tlwiptyf4v32m8ad94jy76c" firing 2024-11-26 01:46:18.069511962 +0000 UTC 2.856185856e+09
alertname="task_high_memory_usage_1g" container_label_com_docker_swarm_node_id="zn6molvsehr5g0mfoutenztux" container_label_com_docker_swarm_task_name="alpina-we-stage_db.1.o9fz5ciht8rj56uo4xivv1ilf" firing 2024-11-26 01:46:33.069511962 +0000 UTC 2.311110656e+09
alertname="task_high_memory_usage_1g" container_label_com_docker_swarm_node_id="zn6molvsehr5g0mfoutenztux" container_label_com_docker_swarm_task_name="alpina-we-dev2_db.1.yoen5w9xtswkwvawihinepox2" firing 2024-11-26 01:45:48.069511962 +0000 UTC 2.344579072e+09
node_cpu_usage (0 active)
# Fires when a Swarm node's non-idle CPU percentage stays above 50 for one minute.
# The expression takes the 1m irate of idle-mode node_cpu_seconds_total, joins it
# to node_meta on `instance` to pull in the node_name label, scales it by 100,
# averages per node_name, and subtracts that idle percentage from 100.
# NOTE(review): the join multiplies by node_meta's sample value, so this
# presumably relies on node_meta being 1 -- confirm against the exporter.
alert: node_cpu_usage
expr: 100
  - (avg by(node_name) (irate(node_cpu_seconds_total{mode="idle"}[1m]) * on(instance)
  group_left(node_name) node_meta * 100)) > 50
for: 1m
labels:
  severity: warning
annotations:
  # $value is the computed usage percentage; humanize formats it for display.
  description: Swarm node {{ $labels.node_name }} CPU usage is at {{ humanize $value}}%.
  summary: CPU alert for Swarm node '{{ $labels.node_name }}'
node_disk_fill_rate_6h (0 active)
# Fires when a linear extrapolation of free space on the /rootfs mountpoint,
# fitted over the last hour and projected 6 * 3600 seconds ahead, drops below
# zero, and that prediction holds for one hour.
# The join with node_meta on `instance` attaches the node_name label.
# NOTE(review): the result is multiplied by node_meta's sample value, so the
# `< 0` test presumably assumes node_meta is a positive constant (1) -- confirm.
alert: node_disk_fill_rate_6h
expr: predict_linear(node_filesystem_free_bytes{mountpoint="/rootfs"}[1h],
  6 * 3600) * on(instance) group_left(node_name) node_meta < 0
for: 1h
labels:
  severity: critical
annotations:
  description: Swarm node {{ $labels.node_name }} disk is going to fill up in 6h.
  summary: Disk fill alert for Swarm node '{{ $labels.node_name }}'
node_disk_usage (0 active)
# Fires when the used share of the /rootfs filesystem stays above 85 percent
# for one minute. Usage is computed as (size - free) * 100 / size, then joined
# to node_meta on `instance` so the alert carries the node_name label.
# NOTE(review): the percentage is multiplied by node_meta's sample value, so
# this presumably relies on node_meta being 1 -- confirm against the exporter.
alert: node_disk_usage
expr: ((node_filesystem_size_bytes{mountpoint="/rootfs"}
  - node_filesystem_free_bytes{mountpoint="/rootfs"}) * 100 / node_filesystem_size_bytes{mountpoint="/rootfs"})
  * on(instance) group_left(node_name) node_meta > 85
for: 1m
labels:
  severity: warning
annotations:
  # $value is the computed usage percentage; humanize formats it for display.
  description: Swarm node {{ $labels.node_name }} disk usage is at {{ humanize $value}}%.
  summary: Disk alert for Swarm node '{{ $labels.node_name }}'
node_memory_usage (0 active)
# Fires when a Swarm node's memory usage stays above 80 percent for one minute.
# Usage is (MemTotal - MemAvailable) / MemTotal, joined to node_meta on
# `instance` to attach node_name, scaled by 100 and summed per node_name.
# NOTE(review): the ratio is multiplied by node_meta's sample value, so this
# presumably relies on node_meta being 1 -- confirm against the exporter.
alert: node_memory_usage
expr: sum
  by(node_name) (((node_memory_MemTotal_bytes - node_memory_MemAvailable_bytes) /
  node_memory_MemTotal_bytes) * on(instance) group_left(node_name) node_meta * 100)
  > 80
for: 1m
labels:
  severity: warning
annotations:
  # $value is the computed usage percentage; humanize formats it for display.
  description: Swarm node {{ $labels.node_name }} memory usage is at {{ humanize $value}}%.
  summary: Memory alert for Swarm node '{{ $labels.node_name }}'
task_high_cpu_usage_50 (0 active)
# Fires when the 1m rate of container_cpu_usage_seconds_total, summed per Swarm
# task name and node id and scaled by 100, stays above 50 for one minute.
# The =~".+" matcher keeps only series whose Swarm task-name label is non-empty.
alert: task_high_cpu_usage_50
expr: sum
  by(container_label_com_docker_swarm_task_name, container_label_com_docker_swarm_node_id)
  (rate(container_cpu_usage_seconds_total{container_label_com_docker_swarm_task_name=~".+"}[1m]))
  * 100 > 50
for: 1m
# NOTE(review): the node_* rules in this listing attach a severity label; this
# rule has none. Confirm that is intentional before relying on severity routing.
annotations:
  # Double-quoted so the literal single quotes around the node id remain part of
  # the scalar; in a single-quoted scalar they would terminate the string early.
  description: "{{ $labels.container_label_com_docker_swarm_task_name }} on '{{
    $labels.container_label_com_docker_swarm_node_id }}' CPU usage is at {{ humanize
    $value}}%."
  summary: CPU alert for Swarm task '{{ $labels.container_label_com_docker_swarm_task_name
    }}' on '{{ $labels.container_label_com_docker_swarm_node_id }}'