|
|
|
@ -383,6 +383,24 @@ groups:
|
|
|
|
summary: "Elasticsearch health status is not green. Please Check"
|
|
|
|
summary: "Elasticsearch health status is not green. Please Check"
|
|
|
|
description: "Alert for Elasticsearch health status"
|
|
|
|
description: "Alert for Elasticsearch health status"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
- alert: elasticsearch - usage of active shards greater than 90%
  # Early-warning rule: percentage of the cluster-wide shard limit that is
  # currently occupied by active shards.
  #
  # The limit is modelled as (number of data nodes) x (per-node shard limit).
  # Only data nodes are counted because Elasticsearch derives the cluster
  # shard limit from data nodes; counting master-only or coordinating-only
  # nodes would overstate capacity and make the alert fire too late.
  # NOTE(review): assumes elastic_cluster_settings_max_shards carries the
  # value of cluster.max_shards_per_node - confirm against the inventory.
  expr: avg(elasticsearch_cluster_health_active_shards) * 100 / (avg(elasticsearch_cluster_health_number_of_data_nodes) * {{ elastic_cluster_settings_max_shards }}) > 90
  # Must hold for 30 minutes before firing.
  for: 30m
  labels:
    severity: warning
  annotations:
    summary: "ES cluster - active shards reaches WARN-threshold... Please clean up"
    description: "WARNING: Alert for ES active shards usage"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
- alert: elasticsearch - usage of active shards greater than 95%
  # Critical rule: same usage ratio as the 90% warning rule, but with a
  # higher threshold and a much shorter hold time.
  #
  # The limit is modelled as (number of data nodes) x (per-node shard limit).
  # Only data nodes are counted because Elasticsearch derives the cluster
  # shard limit from data nodes; counting master-only or coordinating-only
  # nodes would overstate capacity and make the alert fire too late.
  # NOTE(review): assumes elastic_cluster_settings_max_shards carries the
  # value of cluster.max_shards_per_node - confirm against the inventory.
  expr: avg(elasticsearch_cluster_health_active_shards) * 100 / (avg(elasticsearch_cluster_health_number_of_data_nodes) * {{ elastic_cluster_settings_max_shards }}) > 95
  # Must hold for 5 minutes before firing.
  for: 5m
  labels:
    severity: critical
  annotations:
    summary: "ES cluster - active shards reaches CRITICAL-threshold... Please clean up"
    # Prefix matches the severity label; it previously said "WARNING".
    description: "CRITICAL: Alert for ES active shards usage"
|
|
|
|
|
|
|
|
|
|
|
|
- alert: awx job failed with status error
|
|
|
|
- alert: awx job failed with status error
|
|
|
|
expr: changes(awx_status_total{status="error"}[2m]) > 0
|
|
|
|
expr: changes(awx_status_total{status="error"}[2m]) > 0
|
|
|
|
for: 2m
|
|
|
|
for: 2m
|
|
|
|
|