2020-09-19 20:22:12 +00:00
package watchdog
2020-09-16 23:26:19 +00:00
import (
2021-12-03 03:15:51 +00:00
"errors"
2020-11-13 20:01:21 +00:00
"log"
2021-12-03 03:15:51 +00:00
"os"
2020-11-13 20:01:21 +00:00
2022-12-06 06:41:09 +00:00
"github.com/TwiN/gatus/v5/alerting"
"github.com/TwiN/gatus/v5/core"
2020-09-16 23:26:19 +00:00
)
2020-09-19 20:22:12 +00:00
// HandleAlerting takes care of alerts to resolve and alerts to trigger based on result success or failure
2021-10-23 20:47:12 +00:00
func HandleAlerting ( endpoint * core . Endpoint , result * core . Result , alertingConfig * alerting . Config , debug bool ) {
2021-05-19 02:29:15 +00:00
if alertingConfig == nil {
2020-09-16 23:26:19 +00:00
return
}
if result . Success {
2021-10-23 20:47:12 +00:00
handleAlertsToResolve ( endpoint , result , alertingConfig , debug )
2020-09-16 23:26:19 +00:00
} else {
2021-10-23 20:47:12 +00:00
handleAlertsToTrigger ( endpoint , result , alertingConfig , debug )
2020-09-16 23:26:19 +00:00
}
}
2021-10-23 20:47:12 +00:00
func handleAlertsToTrigger ( endpoint * core . Endpoint , result * core . Result , alertingConfig * alerting . Config , debug bool ) {
endpoint . NumberOfSuccessesInARow = 0
endpoint . NumberOfFailuresInARow ++
for _ , endpointAlert := range endpoint . Alerts {
// If the alert hasn't been triggered, move to the next one
if ! endpointAlert . IsEnabled ( ) || endpointAlert . FailureThreshold > endpoint . NumberOfFailuresInARow {
2020-09-16 23:26:19 +00:00
continue
}
2021-10-23 20:47:12 +00:00
if endpointAlert . Triggered {
2021-05-19 02:29:15 +00:00
if debug {
2021-10-23 20:47:12 +00:00
log . Printf ( "[watchdog][handleAlertsToTrigger] Alert for endpoint=%s with description='%s' has already been TRIGGERED, skipping" , endpoint . Name , endpointAlert . GetDescription ( ) )
2020-09-16 23:26:19 +00:00
}
continue
}
2021-10-23 20:47:12 +00:00
alertProvider := alertingConfig . GetAlertingProviderByAlertType ( endpointAlert . Type )
2022-12-16 01:54:38 +00:00
if alertProvider != nil {
2021-10-23 20:47:12 +00:00
log . Printf ( "[watchdog][handleAlertsToTrigger] Sending %s alert because alert for endpoint=%s with description='%s' has been TRIGGERED" , endpointAlert . Type , endpoint . Name , endpointAlert . GetDescription ( ) )
2021-12-03 03:15:51 +00:00
var err error
if os . Getenv ( "MOCK_ALERT_PROVIDER" ) == "true" {
if os . Getenv ( "MOCK_ALERT_PROVIDER_ERROR" ) == "true" {
err = errors . New ( "error" )
}
} else {
err = alertProvider . Send ( endpoint , endpointAlert , result , false )
}
2020-09-16 23:26:19 +00:00
if err != nil {
2021-10-23 20:47:12 +00:00
log . Printf ( "[watchdog][handleAlertsToTrigger] Failed to send an alert for endpoint=%s: %s" , endpoint . Name , err . Error ( ) )
2020-09-16 23:26:19 +00:00
} else {
2021-10-23 20:47:12 +00:00
endpointAlert . Triggered = true
2020-09-16 23:26:19 +00:00
}
2020-09-26 18:23:43 +00:00
} else {
2021-10-23 20:47:12 +00:00
log . Printf ( "[watchdog][handleAlertsToResolve] Not sending alert of type=%s despite being TRIGGERED, because the provider wasn't configured properly" , endpointAlert . Type )
2020-09-16 23:26:19 +00:00
}
}
}
2021-10-23 20:47:12 +00:00
func handleAlertsToResolve ( endpoint * core . Endpoint , result * core . Result , alertingConfig * alerting . Config , debug bool ) {
endpoint . NumberOfSuccessesInARow ++
for _ , endpointAlert := range endpoint . Alerts {
if ! endpointAlert . IsEnabled ( ) || ! endpointAlert . Triggered || endpointAlert . SuccessThreshold > endpoint . NumberOfSuccessesInARow {
2020-09-16 23:26:19 +00:00
continue
}
2021-10-23 20:47:12 +00:00
// Even if the alert provider returns an error, we still set the alert's Triggered variable to false.
2021-01-21 21:14:32 +00:00
// Further explanation can be found on Alert's Triggered field.
2021-10-23 20:47:12 +00:00
endpointAlert . Triggered = false
if ! endpointAlert . IsSendingOnResolved ( ) {
2020-09-16 23:26:19 +00:00
continue
}
2021-10-23 20:47:12 +00:00
alertProvider := alertingConfig . GetAlertingProviderByAlertType ( endpointAlert . Type )
2022-12-16 01:54:38 +00:00
if alertProvider != nil {
2021-10-23 20:47:12 +00:00
log . Printf ( "[watchdog][handleAlertsToResolve] Sending %s alert because alert for endpoint=%s with description='%s' has been RESOLVED" , endpointAlert . Type , endpoint . Name , endpointAlert . GetDescription ( ) )
2021-12-03 02:05:17 +00:00
err := alertProvider . Send ( endpoint , endpointAlert , result , true )
2020-09-16 23:26:19 +00:00
if err != nil {
2021-10-23 20:47:12 +00:00
log . Printf ( "[watchdog][handleAlertsToResolve] Failed to send an alert for endpoint=%s: %s" , endpoint . Name , err . Error ( ) )
2020-09-16 23:26:19 +00:00
}
2020-09-26 18:23:43 +00:00
} else {
2021-10-23 20:47:12 +00:00
log . Printf ( "[watchdog][handleAlertsToResolve] Not sending alert of type=%s despite being RESOLVED, because the provider wasn't configured properly" , endpointAlert . Type )
2020-09-16 23:26:19 +00:00
}
}
2021-10-23 20:47:12 +00:00
endpoint . NumberOfFailuresInARow = 0
2020-09-16 23:26:19 +00:00
}