Add alarms and alarm clusters

Change-Id: I136a4c1d25bdac64f0e3f6a3d19d44eacc5030d6
This commit is contained in:
Ales Komarek 2016-11-10 00:06:05 +01:00 committed by Éric Lemoine
parent 2503d623dd
commit 6b930a588c
1 changed file with 212 additions and 0 deletions

View File

@@ -18,3 +18,215 @@ log_collector:
priority: ["^Seq"]
decoder: "cinder_decoder"
splitter: "cinder_splitter"
# Triggers and alarms declared for the metric_collector section.
metric_collector:
  trigger:
    # Warning when the max of log_messages (service=cinder, level=error)
    # over the window is greater than 0.1.
    cinder_logs_error:
      description: 'Too many errors have been detected in Cinder logs'
      severity: warning
      no_data_policy: okay
      rules:
        - metric: log_messages
          field:
            service: cinder
            level: error
          relational_operator: '>'
          threshold: 0.1
          window: 70  # presumably seconds - TODO confirm
          periods: 0
          function: max
    # Down when the last openstack_check_local_api value for cinder-api is 0.
    cinder_api_local_endpoint:
      description: 'Cinder API is locally down'
      severity: down
      rules:
        - metric: openstack_check_local_api
          field:
            service: cinder-api
          relational_operator: '=='
          threshold: 0
          window: 60  # presumably seconds - TODO confirm
          periods: 0
          function: last
  alarm:
    # Each alarm names the triggers it evaluates and carries a `service`
    # dimension; the aggregator alarm clusters in this file match on that
    # same `service` value.
    cinder_logs:
      alerting: enabled
      triggers:
        - cinder_logs_error
      dimension:
        service: cinder-logs
    cinder_api_endpoint:
      alerting: enabled
      triggers:
        - cinder_api_local_endpoint
      dimension:
        service: cinder-api-endpoint
# Triggers and alarms declared for the remote_collector section.
# Every rule below compares the `last` value of its metric over the window.
remote_collector:
  trigger:
    # Down when the last openstack_check_api value for cinder-api is 0.
    cinder_api_check_failed:
      description: 'Endpoint check for cinder-api is failed'
      severity: down
      rules:
        - metric: openstack_check_api
          field:
            service: cinder-api
          relational_operator: '=='
          threshold: 0
          window: 60
          periods: 0
          function: last

    # --- scheduler service triggers ---
    cinder_scheduler_one_down:
      description: 'At least one Cinder scheduler is down'
      severity: warning
      rules:
        - metric: openstack_cinder_services
          field:
            service: scheduler
            state: down
          relational_operator: '>'
          threshold: 0
          window: 60
          periods: 0
          function: last
    # NOTE(review): a threshold of 50 reads like a percentage. Confirm
    # whether openstack_cinder_services reports a percentage or a count;
    # with a plain count, '<= 50' would not express "majority down".
    cinder_scheduler_majority_down:
      description: 'Majority of Cinder schedulers are down'
      severity: critical
      rules:
        - metric: openstack_cinder_services
          field:
            service: scheduler
            state: up
          relational_operator: '<='
          threshold: 50
          window: 60
          periods: 0
          function: last
    cinder_scheduler_all_down:
      description: 'All Cinder schedulers are down'
      severity: down
      rules:
        - metric: openstack_cinder_services
          field:
            service: scheduler
            state: up
          relational_operator: '=='
          threshold: 0
          window: 60
          periods: 0
          function: last

    # --- volume service triggers ---
    cinder_volume_one_down:
      description: 'At least one Cinder volume is down'
      severity: warning
      rules:
        - metric: openstack_cinder_services
          field:
            # Must select the volume service, like the other
            # cinder_volume_* triggers; the scheduler is already covered
            # by cinder_scheduler_one_down.
            service: volume
            state: down
          relational_operator: '>'
          threshold: 0
          window: 60
          periods: 0
          function: last
    # NOTE(review): same percentage-vs-count question as for
    # cinder_scheduler_majority_down applies to this threshold.
    cinder_volume_majority_down:
      description: 'Majority of Cinder volumes are down'
      severity: critical
      rules:
        - metric: openstack_cinder_services
          field:
            service: volume
            state: up
          relational_operator: '<='
          threshold: 50
          window: 60
          periods: 0
          function: last
    cinder_volume_all_down:
      description: 'All Cinder volumes are down'
      severity: down
      rules:
        - metric: openstack_cinder_services
          field:
            service: volume
            state: up
          relational_operator: '=='
          threshold: 0
          window: 60
          periods: 0
          function: last
  alarm:
    # `alerting` uses the string value `enabled`, the same spelling as the
    # metric_collector alarms in this file, instead of a YAML boolean.
    # Triggers are listed from the most severe (down) to the least
    # severe (warning).
    cinder_api_check:
      alerting: enabled
      triggers:
        - cinder_api_check_failed
      dimension:
        service: cinder-api-check
    cinder_volume:
      alerting: enabled
      triggers:
        - cinder_volume_all_down
        - cinder_volume_majority_down
        - cinder_volume_one_down
      dimension:
        service: cinder-volume
    cinder_scheduler:
      alerting: enabled
      triggers:
        - cinder_scheduler_all_down
        - cinder_scheduler_majority_down
        - cinder_scheduler_one_down
      dimension:
        service: cinder-scheduler
# Alarm clusters declared for the aggregator section.
aggregator:
  alarm_cluster:
    # The first five clusters each match one `service` dimension value set
    # by an alarm in this file and re-tag the result with `service: cinder`.
    # The two clusters fed by metric_collector alarms also set
    # `group_by: hostname`.
    cinder_logs:
      policy: highest_severity
      group_by: hostname
      match:
        service: cinder-logs
      members:
        - cinder_logs
      dimension:
        service: cinder
    cinder_api_endpoint:
      policy: availability_of_members
      group_by: hostname
      match:
        service: cinder-api-endpoint
      members:
        - cinder_api_endpoint
      dimension:
        service: cinder
    cinder_api_check:
      policy: highest_severity
      match:
        service: cinder-api-check
      members:
        - cinder_api_check
      dimension:
        service: cinder
    cinder_volume:
      policy: highest_severity
      match:
        service: cinder-volume
      members:
        - cinder_volume
      dimension:
        service: cinder
    cinder_scheduler:
      policy: highest_severity
      match:
        service: cinder-scheduler
      members:
        - cinder_scheduler
      dimension:
        service: cinder
    # Top-level cluster: matches `service: cinder`, lists the five clusters
    # above as members, and is tagged with `cluster_name: cinder`.
    cinder:
      policy: highest_severity
      match:
        service: cinder
      members:
        - cinder_logs
        - cinder_api_endpoint
        - cinder_api_check
        - cinder_volume
        - cinder_scheduler
      dimension:
        cluster_name: cinder