Lately we have been noticing that the "first_notification_delay" config is no longer working correctly for some services.
We have several services set up to send out notifications; these all inherit settings from the same service template.
On the service template we have first_notification_delay set to 5 minutes, to avoid false alerts.
However, lately we have been noticing that this doesn't work correctly for some (not all) services.
Here is the config of a service for which no notification delay happens:
Code: Select all
define service {
host_name host_A
service_description service_A
use template_customer_A
register 1
}
Code: Select all
define service {
name template_customer_A
service_description Customer A CRITITCAL Service through Satellite Nagios
use ALG_generic-service-satnag
notification_period SHR_24x7
contacts Jira_24-7
contact_groups customerA-oncall
register 0
}
Code: Select all
define service {
name ALG_generic-service-satnag
service_description Hosting base template for services via a satelllite Nagios
use ALG_generic-service-active
check_command check_dummy!0!"No data received yet."
initial_state u
max_check_attempts 1
active_checks_enabled 0
passive_checks_enabled 1
register 0
}
Code: Select all
define service {
name ALG_generic-service-active
service_description Hosting base template for active service
is_volatile 0
initial_state u
max_check_attempts 3
check_interval 5
retry_interval 1
active_checks_enabled 1
passive_checks_enabled 1
check_period SHR_24x7
obsess_over_service 1
check_freshness 0
event_handler_enabled 1
flap_detection_enabled 1
process_perf_data 1
retain_status_information 1
retain_nonstatus_information 1
notification_interval 120
first_notification_delay 5
notification_period SHR_workhours_extend
notification_options w,c,r,
notifications_enabled 1
contacts slack
register 0
}
Contact definitions:
Code: Select all
define contactgroup {
contactgroup_name customerA-oncall
alias Customer A OnCall
members Customer A oncall,support
}
define contact {
contact_name Customer A oncall
alias Customer A oncall
host_notifications_enabled 1
service_notifications_enabled 1
host_notification_period SHR_24x7
service_notification_period SHR_24x7
host_notification_options d,r,
service_notification_options w,c,r,
host_notification_commands notify-host-by-email,notify-host-by-slack,notify-host-by-text
service_notification_commands notify-service-by-email,notify-service-by-slack,notify-service-by-text
can_submit_commands 0
email [email protected]
address1 xxxxxxxxxxxx
}
For another service, which has an almost identical config, the first notification delay does seem to be respected:
Code: Select all
define service {
host_name host_B
service_description service B
use template_customer_B
register 1
}
Code: Select all
define service {
name template_customer_B
service_description Customer B CRITITCAL Service through Satellite Nagios
use ALG_generic-service-satnag
max_check_attempts 1
flap_detection_enabled 0
notification_period SHR_24x7
contacts Jira_24-7
contact_groups CustomerB-oncall
register 0
}
The contact definition is also very similar:
Code: Select all
define contactgroup {
contactgroup_name CustomerB-oncall
alias Customer B OnCall
members Customer B OnCall,support
}
define contact {
contact_name Customer B OnCall
alias Customer B OnCall
host_notifications_enabled 1
service_notifications_enabled 1
host_notification_period SHR_24x7
service_notification_period SHR_24x7
host_notification_options d,r,
service_notification_options w,c,r,
host_notification_commands notify-host-by-email,notify-host-by-slack,notify-host-by-text
service_notification_commands notify-service-by-email,notify-service-by-slack,notify-service-by-text
can_submit_commands 0
email [email protected]
address1 xxxxxxxxxx
}
Any ideas on troubleshooting this issue?
Thanks