1
0
Fork 0
mirror of https://github.com/arangodb/kube-arangodb.git synced 2024-12-14 11:57:37 +00:00

Add metrics for the current plan actions (#879)

This commit is contained in:
Tomasz Mielech 2022-01-05 12:02:51 +01:00 committed by GitHub
parent f25a7d123c
commit 061d1d7cbb
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
4 changed files with 40 additions and 10 deletions

View file

@ -12,6 +12,7 @@
- Add core containers names to follow their terminations - Add core containers names to follow their terminations
- Add ArangoJob and Apps Operator - Add ArangoJob and Apps Operator
- Use Go 1.17 - Use Go 1.17
- Add metrics for the plan actions
## [1.2.6](https://github.com/arangodb/kube-arangodb/tree/1.2.6) (2021-12-15) ## [1.2.6](https://github.com/arangodb/kube-arangodb/tree/1.2.6) (2021-12-15)
- Add ArangoBackup backoff functionality - Add ArangoBackup backoff functionality

View file

@ -301,6 +301,11 @@ func (a Action) SetImage(image string) Action {
return a return a
} }
// IsStarted reports whether the action has already been started.
// An action counts as started once its StartTime holds a non-zero value;
// the result is the negation of StartTime.IsZero().
func (a Action) IsStarted() bool {
return !a.StartTime.IsZero()
}
// AsPlan parse action list into plan // AsPlan parse action list into plan
func AsPlan(a []Action) Plan { func AsPlan(a []Action) Plan {
return a return a

View file

@ -301,6 +301,11 @@ func (a Action) SetImage(image string) Action {
return a return a
} }
// IsStarted reports whether the action has already been started.
// An action counts as started once its StartTime holds a non-zero value;
// the result is the negation of StartTime.IsZero().
func (a Action) IsStarted() bool {
return !a.StartTime.IsZero()
}
// AsPlan parse action list into plan // AsPlan parse action list into plan
func AsPlan(a []Action) Plan { func AsPlan(a []Action) Plan {
return a return a

View file

@ -17,9 +17,6 @@
// //
// Copyright holder is ArangoDB GmbH, Cologne, Germany // Copyright holder is ArangoDB GmbH, Cologne, Germany
// //
// Author Ewout Prangsma
// Author Tomasz Mielech
//
package reconcile package reconcile
@ -28,22 +25,23 @@ import (
"fmt" "fmt"
"time" "time"
"github.com/arangodb/kube-arangodb/pkg/metrics"
"github.com/arangodb/kube-arangodb/pkg/util/errors"
inspectorInterface "github.com/arangodb/kube-arangodb/pkg/util/k8sutil/inspector"
"github.com/rs/zerolog" "github.com/rs/zerolog"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
api "github.com/arangodb/kube-arangodb/pkg/apis/deployment/v1" api "github.com/arangodb/kube-arangodb/pkg/apis/deployment/v1"
"github.com/arangodb/kube-arangodb/pkg/metrics"
"github.com/arangodb/kube-arangodb/pkg/util/errors"
"github.com/arangodb/kube-arangodb/pkg/util/k8sutil" "github.com/arangodb/kube-arangodb/pkg/util/k8sutil"
inspectorInterface "github.com/arangodb/kube-arangodb/pkg/util/k8sutil/inspector"
) )
var ( var (
actionsGeneratedMetrics = metrics.MustRegisterCounterVec(reconciliationComponent, "actions_generated", "Number of actions added to the plan", metrics.DeploymentName, metrics.ActionName, metrics.ActionPriority) actionsGeneratedMetrics = metrics.MustRegisterCounterVec(reconciliationComponent, "actions_generated", "Number of actions added to the plan", metrics.DeploymentName, metrics.ActionName, metrics.ActionPriority)
actionsSucceededMetrics = metrics.MustRegisterCounterVec(reconciliationComponent, "actions_succeeded", "Number of succeeded actions", metrics.DeploymentName, metrics.ActionName, metrics.ActionPriority) actionsSucceededMetrics = metrics.MustRegisterCounterVec(reconciliationComponent, "actions_succeeded", "Number of succeeded actions", metrics.DeploymentName, metrics.ActionName, metrics.ActionPriority)
actionsFailedMetrics = metrics.MustRegisterCounterVec(reconciliationComponent, "actions_failed", "Number of failed actions", metrics.DeploymentName, metrics.ActionName, metrics.ActionPriority) actionsFailedMetrics = metrics.MustRegisterCounterVec(reconciliationComponent, "actions_failed", "Number of failed actions", metrics.DeploymentName, metrics.ActionName, metrics.ActionPriority)
actionsCurrentPlan = metrics.MustRegisterGaugeVec(reconciliationComponent, "actions_current",
"The current number of the plan actions are being performed",
metrics.DeploymentName, "group", "member", "name", "priority")
) )
type planner interface { type planner interface {
@ -179,16 +177,31 @@ func (d *Reconciler) executePlan(ctx context.Context, cachedStatus inspectorInte
done, abort, recall, err := d.executeAction(ctx, log, planAction, action) done, abort, recall, err := d.executeAction(ctx, log, planAction, action)
if err != nil { if err != nil {
// The Plan will be cleaned up, so no actions will be in the queue.
actionsCurrentPlan.WithLabelValues(d.context.GetName(), planAction.Group.AsRole(), planAction.MemberID,
planAction.Type.String(), pg.Type()).Set(0.0)
actionsFailedMetrics.WithLabelValues(d.context.GetName(), planAction.Type.String(), pg.Type()).Inc() actionsFailedMetrics.WithLabelValues(d.context.GetName(), planAction.Type.String(), pg.Type()).Inc()
return nil, false, errors.WithStack(err) return nil, false, errors.WithStack(err)
} }
if abort { if abort {
// The Plan will be cleaned up, so no actions will be in the queue.
actionsCurrentPlan.WithLabelValues(d.context.GetName(), planAction.Group.AsRole(), planAction.MemberID,
planAction.Type.String(), pg.Type()).Set(0.0)
actionsFailedMetrics.WithLabelValues(d.context.GetName(), planAction.Type.String(), pg.Type()).Inc() actionsFailedMetrics.WithLabelValues(d.context.GetName(), planAction.Type.String(), pg.Type()).Inc()
return nil, true, nil return nil, true, nil
} }
if done { if done {
if planAction.IsStarted() {
// The metric below was incremented in a previous iteration, so it must be decremented now.
// If the action was started and finished within this same iteration, the metric was never incremented.
actionsCurrentPlan.WithLabelValues(d.context.GetName(), planAction.Group.AsRole(), planAction.MemberID,
planAction.Type.String(), pg.Type()).Dec()
}
actionsSucceededMetrics.WithLabelValues(d.context.GetName(), planAction.Type.String(), pg.Type()).Inc() actionsSucceededMetrics.WithLabelValues(d.context.GetName(), planAction.Type.String(), pg.Type()).Inc()
if len(plan) > 1 { if len(plan) > 1 {
plan = plan[1:] plan = plan[1:]
@ -196,6 +209,8 @@ func (d *Reconciler) executePlan(ctx context.Context, cachedStatus inspectorInte
plan[0].MemberID = action.MemberID() plan[0].MemberID = action.MemberID()
} }
} else { } else {
actionsCurrentPlan.WithLabelValues(d.context.GetName(), planAction.Group.AsRole(), planAction.MemberID,
planAction.Type.String(), pg.Type()).Set(0.0)
plan = nil plan = nil
} }
@ -218,7 +233,11 @@ func (d *Reconciler) executePlan(ctx context.Context, cachedStatus inspectorInte
return nil, false, errors.WithStack(err) return nil, false, errors.WithStack(err)
} }
} else { } else {
if plan[0].StartTime.IsZero() { if !plan[0].IsStarted() {
// The action has been started in this iteration, but it is not finished yet.
actionsCurrentPlan.WithLabelValues(d.context.GetName(), planAction.Group.AsRole(), planAction.MemberID,
planAction.Type.String(), pg.Type()).Inc()
now := metav1.Now() now := metav1.Now()
plan[0].StartTime = &now plan[0].StartTime = &now
} }
@ -229,7 +248,7 @@ func (d *Reconciler) executePlan(ctx context.Context, cachedStatus inspectorInte
} }
func (d *Reconciler) executeAction(ctx context.Context, log zerolog.Logger, planAction api.Action, action Action) (done, abort, callAgain bool, err error) { func (d *Reconciler) executeAction(ctx context.Context, log zerolog.Logger, planAction api.Action, action Action) (done, abort, callAgain bool, err error) {
if planAction.StartTime.IsZero() { if !planAction.IsStarted() {
// Not started yet // Not started yet
ready, err := action.Start(ctx) ready, err := action.Start(ctx)
if err != nil { if err != nil {