notifier: retry upon failure
This commit is contained in:
parent
3ff8bfaa93
commit
480589a83a
@ -29,6 +29,8 @@ updater:
|
|||||||
# Use 0 to disable the updater entirely.
|
# Use 0 to disable the updater entirely.
|
||||||
interval: 2h
|
interval: 2h
|
||||||
notifier:
|
notifier:
|
||||||
|
# How many attempts will the notifier do when a notifier backend fails.
|
||||||
|
attempts: 3
|
||||||
# Configuration for HTTP notifier
|
# Configuration for HTTP notifier
|
||||||
http:
|
http:
|
||||||
# Endpoint that will receive notifications with POST requests.
|
# Endpoint that will receive notifications with POST requests.
|
||||||
|
@ -44,6 +44,7 @@ type UpdaterConfig struct {
|
|||||||
|
|
||||||
// NotifierConfig is the configuration for the Notifier service and its registered notifiers.
|
// NotifierConfig is the configuration for the Notifier service and its registered notifiers.
|
||||||
type NotifierConfig struct {
|
type NotifierConfig struct {
|
||||||
|
Attempts int
|
||||||
Params map[string]interface{} `yaml:",inline"`
|
Params map[string]interface{} `yaml:",inline"`
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -68,6 +69,9 @@ var DefaultConfig = Config{
|
|||||||
HealthPort: 6061,
|
HealthPort: 6061,
|
||||||
Timeout: 900 * time.Second,
|
Timeout: 900 * time.Second,
|
||||||
},
|
},
|
||||||
|
Notifier: &NotifierConfig{
|
||||||
|
Attempts: 5,
|
||||||
|
},
|
||||||
}
|
}
|
||||||
|
|
||||||
// Load is a shortcut to open a file, read it, and generate a Config.
|
// Load is a shortcut to open a file, read it, and generate a Config.
|
||||||
|
@ -20,6 +20,7 @@ import (
|
|||||||
"time"
|
"time"
|
||||||
|
|
||||||
"github.com/coreos/pkg/capnslog"
|
"github.com/coreos/pkg/capnslog"
|
||||||
|
"github.com/coreos/pkg/timeutil"
|
||||||
"github.com/pborman/uuid"
|
"github.com/pborman/uuid"
|
||||||
|
|
||||||
"github.com/coreos/clair/config"
|
"github.com/coreos/clair/config"
|
||||||
@ -32,9 +33,9 @@ var log = capnslog.NewPackageLogger("github.com/coreos/clair", "notifier")
|
|||||||
|
|
||||||
const (
|
const (
|
||||||
checkInterval = 5 * time.Minute
|
checkInterval = 5 * time.Minute
|
||||||
|
|
||||||
refreshLockDuration = time.Minute * 2
|
refreshLockDuration = time.Minute * 2
|
||||||
lockDuration = time.Minute*8 + refreshLockDuration
|
lockDuration = time.Minute*8 + refreshLockDuration
|
||||||
|
maxBackOff = 15 * time.Minute
|
||||||
)
|
)
|
||||||
|
|
||||||
// TODO(Quentin-M): Allow registering custom notification handlers.
|
// TODO(Quentin-M): Allow registering custom notification handlers.
|
||||||
@ -114,7 +115,7 @@ func Run(config *config.NotifierConfig, stopper *utils.Stopper) {
|
|||||||
// Handle task.
|
// Handle task.
|
||||||
done := make(chan bool, 1)
|
done := make(chan bool, 1)
|
||||||
go func() {
|
go func() {
|
||||||
if handleTask(notification) {
|
if handleTask(notification, stopper, config.Attempts) {
|
||||||
database.MarkNotificationAsSent(node)
|
database.MarkNotificationAsSent(node)
|
||||||
}
|
}
|
||||||
database.Unlock(node, whoAmI)
|
database.Unlock(node, whoAmI)
|
||||||
@ -160,7 +161,7 @@ func findTask(whoAmI string, stopper *utils.Stopper) (string, database.Notificat
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
func handleTask(notification database.Notification) bool {
|
func handleTask(notification database.Notification, st *utils.Stopper, maxAttempts int) bool {
|
||||||
// Get notification content.
|
// Get notification content.
|
||||||
// TODO(Quentin-M): Split big notifications.
|
// TODO(Quentin-M): Split big notifications.
|
||||||
notificationContent, err := notification.GetContent()
|
notificationContent, err := notification.GetContent()
|
||||||
@ -177,12 +178,35 @@ func handleTask(notification database.Notification) bool {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Send notification.
|
// Send notification.
|
||||||
// TODO(Quentin-M): Backoff / MaxRetries
|
|
||||||
for notifierName, notifier := range notifiers {
|
for notifierName, notifier := range notifiers {
|
||||||
if err := notifier.Send(payload); err != nil {
|
var attempts int
|
||||||
log.Errorf("could not send notification '%s' to notifier '%s': %s", notification.GetName(), notifierName, err)
|
var backOff time.Duration
|
||||||
|
for {
|
||||||
|
// Max attempts exceeded.
|
||||||
|
if attempts >= maxAttempts {
|
||||||
|
log.Infof("giving up on sending notification '%s' to notifier '%s': max attempts exceeded (%d)\n", notification.GetName(), notifierName, maxAttempts)
|
||||||
return false
|
return false
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Backoff.
|
||||||
|
if backOff > 0 {
|
||||||
|
log.Infof("waiting %v before retrying to send notification '%s' to notifier '%s' (Attempt %d / %d)\n", backOff, notification.GetName(), notifierName, attempts+1, maxAttempts)
|
||||||
|
if !st.Sleep(backOff) {
|
||||||
|
return false
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Send using the current notifier.
|
||||||
|
if err := notifier.Send(payload); err == nil {
|
||||||
|
// Send has been successful. Go to the next one.
|
||||||
|
break
|
||||||
|
}
|
||||||
|
|
||||||
|
// Send failed; increase attempts/backoff and retry.
|
||||||
|
log.Errorf("could not send notification '%s' to notifier '%s': %s", notification.GetName(), notifierName, err)
|
||||||
|
backOff = timeutil.ExpBackoff(backOff, maxBackOff)
|
||||||
|
attempts++
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
log.Infof("successfully sent notification '%s'\n", notification.GetName())
|
log.Infof("successfully sent notification '%s'\n", notification.GetName())
|
||||||
|
Loading…
Reference in New Issue
Block a user