1
0
Fork 0
mirror of https://github.com/arangodb/kube-arangodb.git synced 2024-12-14 11:57:37 +00:00

[Bugfix] Fix Maintenance grace period (#961)

This commit is contained in:
Adam Janikowski 2022-04-25 13:56:04 +02:00 committed by GitHub
parent f2776d7dc6
commit 83a80177b9
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
12 changed files with 251 additions and 83 deletions

View file

@ -11,6 +11,7 @@
- (Bugfix) Disable member removal in case of health failure - (Bugfix) Disable member removal in case of health failure
- (Bugfix) Reorder Topology management plan steps - (Bugfix) Reorder Topology management plan steps
- (Feature) UpdateInProgress & UpgradeInProgress Conditions - (Feature) UpdateInProgress & UpgradeInProgress Conditions
- (Bugfix) Fix Maintenance switch and HotBackup race
## [1.2.9](https://github.com/arangodb/kube-arangodb/tree/1.2.9) (2022-03-30) ## [1.2.9](https://github.com/arangodb/kube-arangodb/tree/1.2.9) (2022-03-30)
- (Feature) Improve Kubernetes clientsets management - (Feature) Improve Kubernetes clientsets management

View file

@ -27,7 +27,6 @@ import (
"github.com/arangodb/go-driver" "github.com/arangodb/go-driver"
"github.com/arangodb/go-driver/agency" "github.com/arangodb/go-driver/agency"
"github.com/arangodb/kube-arangodb/pkg/util"
"github.com/arangodb/kube-arangodb/pkg/util/errors" "github.com/arangodb/kube-arangodb/pkg/util/errors"
) )
@ -111,35 +110,7 @@ type StatePlan struct {
} }
type StateSupervision struct { type StateSupervision struct {
Maintenance StateExists `json:"Maintenance,omitempty"` Maintenance StateTimestamp `json:"Maintenance,omitempty"`
}
type StateExists []byte
func (d StateExists) Hash() string {
if d == nil {
return ""
}
return util.SHA256(d)
}
func (d StateExists) Exists() bool {
return d != nil
}
func (d *StateExists) UnmarshalJSON(bytes []byte) error {
if bytes == nil {
*d = nil
return nil
}
z := make([]byte, len(bytes))
copy(z, bytes)
*d = z
return nil
} }
func (s State) CountShards() int { func (s State) CountShards() int {

View file

@ -0,0 +1,51 @@
//
// DISCLAIMER
//
// Copyright 2016-2022 ArangoDB GmbH, Cologne, Germany
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
// Copyright holder is ArangoDB GmbH, Cologne, Germany
//
package agency
import "github.com/arangodb/kube-arangodb/pkg/util"
type StateExists []byte
func (d StateExists) Hash() string {
if d == nil {
return ""
}
return util.SHA256(d)
}
func (d StateExists) Exists() bool {
return d != nil
}
func (d *StateExists) UnmarshalJSON(bytes []byte) error {
if bytes == nil {
*d = nil
return nil
}
z := make([]byte, len(bytes))
copy(z, bytes)
*d = z
return nil
}

View file

@ -0,0 +1,101 @@
//
// DISCLAIMER
//
// Copyright 2016-2022 ArangoDB GmbH, Cologne, Germany
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
// Copyright holder is ArangoDB GmbH, Cologne, Germany
//
package agency
import (
"encoding/json"
"time"
"github.com/arangodb/kube-arangodb/pkg/util"
"github.com/arangodb/kube-arangodb/pkg/util/errors"
)
type StateTimestamp struct {
hash string
data string
time time.Time
parsed bool
exists bool
}
func (s *StateTimestamp) Hash() string {
if s == nil {
return util.SHA256FromString("")
}
return s.hash
}
func (s *StateTimestamp) Exists() bool {
if s == nil {
return false
}
return s.exists
}
func (s *StateTimestamp) Time() (time.Time, bool) {
if s == nil {
return time.Time{}, false
}
if !s.parsed || !s.exists {
return time.Time{}, false
}
return s.time, true
}
func (s *StateTimestamp) UnmarshalJSON(bytes []byte) error {
if s == nil {
return errors.Newf("Object is nil")
}
var t string
if err := json.Unmarshal(bytes, &t); err != nil {
return err
}
*s = unmarshalJSONStateTimestamp(t)
return nil
}
func unmarshalJSONStateTimestamp(s string) StateTimestamp {
var ts = StateTimestamp{
hash: util.SHA256([]byte(s)),
data: s,
exists: true,
}
t, ok := util.ParseAgencyTime(s)
if !ok {
ts.parsed = false
return ts
}
ts.time = t
ts.parsed = true
ts.hash = util.SHA256FromString(s)
return ts
}

View file

@ -25,5 +25,5 @@ type StateTarget struct {
} }
type StateTargetHotBackup struct { type StateTargetHotBackup struct {
Create StateExists `json:"Create,omitempty"` Create StateTimestamp `json:"Create,omitempty"`
} }

View file

@ -33,6 +33,8 @@ func Test_Target_HotBackup(t *testing.T) {
require.NoError(t, json.Unmarshal(agencyDump39HotBackup, &s)) require.NoError(t, json.Unmarshal(agencyDump39HotBackup, &s))
require.True(t, s.Agency.Arango.Target.HotBackup.Create.Exists()) require.True(t, s.Agency.Arango.Target.HotBackup.Create.Exists())
t.Log(s.Agency.Arango.Target.HotBackup.Create.time.String())
}) })
t.Run("Does Not Exists", func(t *testing.T) { t.Run("Does Not Exists", func(t *testing.T) {
var s DumpState var s DumpState

View file

@ -404,25 +404,35 @@ func (d *Deployment) refreshMaintenanceTTL(ctx context.Context) {
return return
} }
condition, ok := d.status.last.Conditions.Get(api.ConditionTypeMaintenanceMode) agencyState, agencyOK := d.GetAgencyCache()
if !agencyOK {
return
}
condition, ok := d.status.last.Conditions.Get(api.ConditionTypeMaintenance)
maintenance := agencyState.Supervision.Maintenance
if !ok || !condition.IsTrue() { if !ok || !condition.IsTrue() {
return return
} }
// Check GracePeriod // Check GracePeriod
if t, ok := maintenance.Time(); ok {
if time.Until(t) < d.apiObject.Spec.Timeouts.GetMaintenanceGracePeriod() {
if err := d.SetAgencyMaintenanceMode(ctx, true); err != nil {
return
}
d.deps.Log.Info().Msgf("Refreshed maintenance lock")
}
} else {
if condition.LastUpdateTime.Add(d.apiObject.Spec.Timeouts.GetMaintenanceGracePeriod()).Before(time.Now()) { if condition.LastUpdateTime.Add(d.apiObject.Spec.Timeouts.GetMaintenanceGracePeriod()).Before(time.Now()) {
if err := d.SetAgencyMaintenanceMode(ctx, true); err != nil { if err := d.SetAgencyMaintenanceMode(ctx, true); err != nil {
return return
} }
if err := d.WithStatusUpdate(ctx, func(s *api.DeploymentStatus) bool {
return s.Conditions.Touch(api.ConditionTypeMaintenanceMode)
}); err != nil {
return
}
d.deps.Log.Info().Msgf("Refreshed maintenance lock") d.deps.Log.Info().Msgf("Refreshed maintenance lock")
} }
} }
}
func (d *Deployment) ensureResources(ctx context.Context, lastInterval util.Interval, cachedStatus inspectorInterface.Inspector) (util.Interval, error) { func (d *Deployment) ensureResources(ctx context.Context, lastInterval util.Interval, cachedStatus inspectorInterface.Inspector) (util.Interval, error) {
// Ensure all resources are created // Ensure all resources are created

View file

@ -21,8 +21,6 @@
package reconcile package reconcile
import ( import (
"context"
api "github.com/arangodb/kube-arangodb/pkg/apis/deployment/v1" api "github.com/arangodb/kube-arangodb/pkg/apis/deployment/v1"
"github.com/rs/zerolog" "github.com/rs/zerolog"
) )
@ -34,7 +32,7 @@ func init() {
func newSetMaintenanceConditionAction(log zerolog.Logger, action api.Action, actionCtx ActionContext) Action { func newSetMaintenanceConditionAction(log zerolog.Logger, action api.Action, actionCtx ActionContext) Action {
a := &actionSetMaintenanceCondition{} a := &actionSetMaintenanceCondition{}
a.actionImpl = newActionImpl(log, action, actionCtx, &a.newMemberID) a.actionImpl = newActionImplDefRef(log, action, actionCtx)
return a return a
} }
@ -43,33 +41,5 @@ type actionSetMaintenanceCondition struct {
// actionImpl implement timeout and member id functions // actionImpl implement timeout and member id functions
actionImpl actionImpl
actionEmptyCheckProgress actionEmpty
newMemberID string
}
func (a *actionSetMaintenanceCondition) Start(ctx context.Context) (bool, error) {
switch a.actionCtx.GetMode() {
case api.DeploymentModeSingle:
return true, nil
}
agencyState, agencyOK := a.actionCtx.GetAgencyCache()
if !agencyOK {
a.log.Error().Msgf("Unable to determine maintenance condition")
} else {
if err := a.actionCtx.WithStatusUpdate(ctx, func(s *api.DeploymentStatus) bool {
if agencyState.Supervision.Maintenance.Exists() {
return s.Conditions.Update(api.ConditionTypeMaintenanceMode, true, "Maintenance", "Maintenance enabled")
} else {
return s.Conditions.Remove(api.ConditionTypeMaintenanceMode)
}
}); err != nil {
a.log.Error().Err(err).Msgf("Unable to set maintenance condition")
return true, nil
}
}
return true, nil
} }

View file

@ -39,8 +39,7 @@ func withMaintenanceStart(plan ...api.Action) api.Plan {
} }
return api.AsPlan(plan).Before( return api.AsPlan(plan).Before(
actions.NewClusterAction(api.ActionTypeEnableMaintenance, "Enable maintenance before actions"), actions.NewClusterAction(api.ActionTypeEnableMaintenance, "Enable maintenance before actions"))
actions.NewClusterAction(api.ActionTypeSetMaintenanceCondition, "Enable maintenance before actions"))
} }
func withResignLeadership(group api.ServerGroup, member api.MemberStatus, reason string, plan ...api.Action) api.Plan { func withResignLeadership(group api.ServerGroup, member api.MemberStatus, reason string, plan ...api.Action) api.Plan {

View file

@ -23,6 +23,8 @@ package reconcile
import ( import (
"context" "context"
"time"
api "github.com/arangodb/kube-arangodb/pkg/apis/deployment/v1" api "github.com/arangodb/kube-arangodb/pkg/apis/deployment/v1"
"github.com/arangodb/kube-arangodb/pkg/deployment/actions" "github.com/arangodb/kube-arangodb/pkg/deployment/actions"
"github.com/arangodb/kube-arangodb/pkg/deployment/features" "github.com/arangodb/kube-arangodb/pkg/deployment/features"
@ -31,6 +33,27 @@ import (
"github.com/rs/zerolog" "github.com/rs/zerolog"
) )
var (
ObsoleteClusterConditions = []api.ConditionType{
api.ConditionTypeMaintenanceMode,
}
)
func cleanupConditions(ctx context.Context,
log zerolog.Logger, apiObject k8sutil.APIObject,
spec api.DeploymentSpec, status api.DeploymentStatus,
cachedStatus inspectorInterface.Inspector, planCtx PlanBuilderContext) api.Plan {
var p api.Plan
for _, c := range ObsoleteClusterConditions {
if _, ok := status.Conditions.Get(c); ok {
p = append(p, removeConditionActionV2("Cleanup Condition", c))
}
}
return p
}
func createMaintenanceManagementPlan(ctx context.Context, func createMaintenanceManagementPlan(ctx context.Context,
log zerolog.Logger, apiObject k8sutil.APIObject, log zerolog.Logger, apiObject k8sutil.APIObject,
spec api.DeploymentSpec, status api.DeploymentStatus, spec api.DeploymentSpec, status api.DeploymentStatus,
@ -50,22 +73,37 @@ func createMaintenanceManagementPlan(ctx context.Context,
return nil return nil
} }
if agencyState.Target.HotBackup.Create.Exists() {
log.Info().Msgf("HotBackup in progress")
return nil
}
enabled := agencyState.Supervision.Maintenance.Exists() enabled := agencyState.Supervision.Maintenance.Exists()
c, cok := status.Conditions.Get(api.ConditionTypeMaintenance)
if (cok && c.IsTrue()) != enabled {
// Condition not yet propagated
log.Info().Msgf("Condition not yet propagated")
return nil
}
if cok {
if t := c.LastTransitionTime.Time; !t.IsZero() {
if time.Since(t) < 5*time.Second {
// Did not elapse 5 s
return nil
}
}
}
if !enabled && spec.Database.GetMaintenance() { if !enabled && spec.Database.GetMaintenance() {
log.Info().Msgf("Enabling maintenance mode") log.Info().Msgf("Enabling maintenance mode")
return api.Plan{actions.NewClusterAction(api.ActionTypeEnableMaintenance), actions.NewClusterAction(api.ActionTypeSetMaintenanceCondition)} return api.Plan{actions.NewClusterAction(api.ActionTypeEnableMaintenance)}
} }
if enabled && !spec.Database.GetMaintenance() { if enabled && !spec.Database.GetMaintenance() {
log.Info().Msgf("Disabling maintenance mode") log.Info().Msgf("Disabling maintenance mode")
return api.Plan{actions.NewClusterAction(api.ActionTypeDisableMaintenance), actions.NewClusterAction(api.ActionTypeSetMaintenanceCondition)} return api.Plan{actions.NewClusterAction(api.ActionTypeDisableMaintenance)}
}
condition, ok := status.Conditions.Get(api.ConditionTypeMaintenanceMode)
if enabled != (ok && condition.IsTrue()) {
return api.Plan{actions.NewClusterAction(api.ActionTypeSetMaintenanceCondition)}
} }
return nil return nil

View file

@ -60,7 +60,8 @@ func createHighPlan(ctx context.Context, log zerolog.Logger, apiObject k8sutil.A
ApplyIfEmpty(createRebalancerCheckPlan). ApplyIfEmpty(createRebalancerCheckPlan).
ApplyWithBackOff(BackOffCheck, time.Minute, emptyPlanBuilder)). ApplyWithBackOff(BackOffCheck, time.Minute, emptyPlanBuilder)).
Apply(createBackupInProgressConditionPlan). // Discover backups always Apply(createBackupInProgressConditionPlan). // Discover backups always
Apply(createMaintenanceConditionPlan) // Discover maintenance always Apply(createMaintenanceConditionPlan). // Discover maintenance always
Apply(cleanupConditions) // Cleanup Conditions
return r.Plan(), r.BackOff(), true return r.Plan(), r.BackOff(), true
} }

View file

@ -23,6 +23,8 @@ package util
import ( import (
"math" "math"
"time"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
) )
@ -41,3 +43,25 @@ func TimeCompareEqualPointer(a, b *metav1.Time) bool {
return TimeCompareEqual(*a, *b) return TimeCompareEqual(*a, *b)
} }
func TimeAgencyLayouts() []string {
return []string{
time.RFC3339,
}
}
func ParseAgencyTime(s string) (time.Time, bool) {
t, id := ParseTime(s, TimeAgencyLayouts()...)
return t, id != -1
}
func ParseTime(s string, layouts ...string) (time.Time, int) {
for id, layout := range layouts {
if t, err := time.Parse(layout, s); err == nil {
return t, id
}
}
return time.Time{}, -1
}