Loading docker-compose.tmpl.yml +1 −1 Original line number Diff line number Diff line Loading @@ -256,4 +256,4 @@ configs: file: ./swarmprom/prometheus/rules/swarm_node.rules.yml task_rules: file: ./swarmprom/prometheus/rules/swarm_task.rules.yml file: ./prometheus/rules/swarm_task.rules.yml prometheus/rules/swarm_task.rules.yml 0 → 100644 +32 −0 Original line number Diff line number Diff line groups: - name: /1/store/projects/vagrant/docker-swarm-vagrant/apps/swarmprom/prometheus/rules/swarm_task.rules.yml rules: - alert: task_high_cpu_usage_50 expr: sum(rate(container_cpu_usage_seconds_total{container_label_com_docker_swarm_task_name=~".+"}[1m])) BY (container_label_com_docker_swarm_task_name, container_label_com_docker_swarm_node_id) * 100 > 50 for: 1m annotations: description: '{{ $labels.container_label_com_docker_swarm_task_name }} on ''{{ $labels.container_label_com_docker_swarm_node_id }}'' CPU usage is at {{ humanize $value}}%.' summary: CPU alert for Swarm task '{{ $labels.container_label_com_docker_swarm_task_name }}' on '{{ $labels.container_label_com_docker_swarm_node_id }}' - alert: task_high_memory_usage_1g expr: sum(container_memory_rss{container_label_com_docker_swarm_task_name=~".+"}) BY (container_label_com_docker_swarm_task_name, container_label_com_docker_swarm_node_id) > 1e+09 for: 1m annotations: description: '{{ $labels.container_label_com_docker_swarm_task_name }} on ''{{ $labels.container_label_com_docker_swarm_node_id }}'' memory usage is {{ humanize $value}}.' summary: Memory alert for Swarm task '{{ $labels.container_label_com_docker_swarm_task_name }}' on '{{ $labels.container_label_com_docker_swarm_node_id }}' - alert: backup_db_not_created expr: time() - backup_created_date_seconds{exported_job="vessel-db", label="ais-db"} > 86400 labels: severity: warning annotations: description: "'{{ $labels.exported_job }}' database backup was not created." summary: "'{{ $labels.label }}' database backup was not created." 
No newline at end of file Loading
docker-compose.tmpl.yml +1 −1 Original line number Diff line number Diff line Loading @@ -256,4 +256,4 @@ configs: file: ./swarmprom/prometheus/rules/swarm_node.rules.yml task_rules: file: ./swarmprom/prometheus/rules/swarm_task.rules.yml file: ./prometheus/rules/swarm_task.rules.yml
---
# prometheus/rules/swarm_task.rules.yml
#
# Prometheus alerting rules for Docker Swarm tasks: one rule group holding
# a per-task CPU alert, a per-task memory alert and a database-backup
# freshness alert.

groups:
  # NOTE(review): the group name is an absolute filesystem path, apparently
  # left over from wherever this file was generated. Kept verbatim here;
  # confirm nothing relies on it before renaming.
  - name: /1/store/projects/vagrant/docker-swarm-vagrant/apps/swarmprom/prometheus/rules/swarm_task.rules.yml
    rules:
      # CPU: per (task name, node id), the summed 1m rate of
      # container_cpu_usage_seconds_total, multiplied by 100, must stay
      # above 50 for 1m before the alert fires.
      - alert: task_high_cpu_usage_50
        expr: >-
          sum(rate(container_cpu_usage_seconds_total{container_label_com_docker_swarm_task_name=~".+"}[1m]))
          BY (container_label_com_docker_swarm_task_name, container_label_com_docker_swarm_node_id)
          * 100 > 50
        for: 1m
        annotations:
          description: >-
            {{ $labels.container_label_com_docker_swarm_task_name }} on
            '{{ $labels.container_label_com_docker_swarm_node_id }}'
            CPU usage is at {{ humanize $value}}%.
          summary: >-
            CPU alert for Swarm task
            '{{ $labels.container_label_com_docker_swarm_task_name }}'
            on '{{ $labels.container_label_com_docker_swarm_node_id }}'

      # Memory: per (task name, node id), the summed container_memory_rss
      # must stay above 1e+09 for 1m. The alert name suggests a 1 GB
      # threshold; the unit is presumably bytes -- TODO confirm.
      - alert: task_high_memory_usage_1g
        expr: >-
          sum(container_memory_rss{container_label_com_docker_swarm_task_name=~".+"})
          BY (container_label_com_docker_swarm_task_name, container_label_com_docker_swarm_node_id)
          > 1e+09
        for: 1m
        annotations:
          description: >-
            {{ $labels.container_label_com_docker_swarm_task_name }} on
            '{{ $labels.container_label_com_docker_swarm_node_id }}'
            memory usage is {{ humanize $value}}.
          summary: >-
            Memory alert for Swarm task
            '{{ $labels.container_label_com_docker_swarm_task_name }}'
            on '{{ $labels.container_label_com_docker_swarm_node_id }}'

      # Backup freshness: fires when time() minus the
      # backup_created_date_seconds sample for exported_job="vessel-db",
      # label="ais-db" exceeds 86400. This is the only rule in the group
      # that sets a severity label.
      # NOTE(review): unlike the two task alerts there is no `for:` clause,
      # and if the series does not exist at all the expression presumably
      # returns nothing, so the alert would stay silent -- confirm whether
      # an absent() guard is wanted.
      - alert: backup_db_not_created
        expr: >-
          time() - backup_created_date_seconds{exported_job="vessel-db", label="ais-db"}
          > 86400
        labels:
          severity: warning
        annotations:
          description: >-
            '{{ $labels.exported_job }}' database backup was not created.
          summary: >-
            '{{ $labels.label }}' database backup was not created.