2018-03-15 15:33:28 +00:00
|
|
|
//
|
|
|
|
// DISCLAIMER
|
|
|
|
//
|
|
|
|
// Copyright 2018 ArangoDB GmbH, Cologne, Germany
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
//
|
|
|
|
// Copyright holder is ArangoDB GmbH, Cologne, Germany
|
|
|
|
//
|
|
|
|
// Author Ewout Prangsma
|
|
|
|
//
|
|
|
|
|
|
|
|
package deployment
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"time"
|
|
|
|
|
2018-03-27 10:11:57 +00:00
|
|
|
api "github.com/arangodb/kube-arangodb/pkg/apis/deployment/v1alpha"
|
2018-03-15 15:33:28 +00:00
|
|
|
"github.com/arangodb/kube-arangodb/pkg/util/k8sutil"
|
2018-04-03 15:43:42 +00:00
|
|
|
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
|
2018-03-15 15:33:28 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
// inspectDeployment inspects the entire deployment, creates
|
|
|
|
// a plan to update if needed and inspects underlying resources.
|
|
|
|
// This function should be called when:
|
|
|
|
// - the deployment has changed
|
|
|
|
// - any of the underlying resources has changed
|
|
|
|
// - once in a while
|
|
|
|
// Returns the delay until this function should be called again.
|
|
|
|
func (d *Deployment) inspectDeployment(lastInterval time.Duration) time.Duration {
|
2018-03-27 10:11:57 +00:00
|
|
|
log := d.deps.Log
|
2018-03-15 15:33:28 +00:00
|
|
|
|
|
|
|
nextInterval := lastInterval
|
|
|
|
hasError := false
|
|
|
|
ctx := context.Background()
|
|
|
|
|
2018-04-03 15:43:42 +00:00
|
|
|
// Check deployment still exists
|
|
|
|
if _, err := d.deps.DatabaseCRCli.DatabaseV1alpha().ArangoDeployments(d.apiObject.GetNamespace()).Get(d.apiObject.GetName(), metav1.GetOptions{}); k8sutil.IsNotFound(err) {
|
|
|
|
// Deployment is gone
|
|
|
|
log.Info().Msg("Deployment is gone")
|
|
|
|
d.Delete()
|
|
|
|
return nextInterval
|
|
|
|
}
|
|
|
|
|
2018-03-27 10:11:57 +00:00
|
|
|
// Is the deployment in failed state, if so, give up.
|
2018-03-27 16:33:21 +00:00
|
|
|
if d.status.Phase == api.DeploymentPhaseFailed {
|
2018-03-27 10:11:57 +00:00
|
|
|
log.Debug().Msg("Deployment is in Failed state.")
|
|
|
|
return nextInterval
|
|
|
|
}
|
|
|
|
|
|
|
|
// Inspect secret hashes
|
|
|
|
if err := d.resources.ValidateSecretHashes(); err != nil {
|
|
|
|
hasError = true
|
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("Secret hash validation failed", err, d.apiObject))
|
|
|
|
}
|
|
|
|
|
|
|
|
// Is the deployment in a good state?
|
|
|
|
if d.status.Conditions.IsTrue(api.ConditionTypeSecretsChanged) {
|
|
|
|
log.Debug().Msg("Condition SecretsChanged is true. Revert secrets before we can continue")
|
|
|
|
return nextInterval
|
|
|
|
}
|
|
|
|
|
2018-03-20 12:10:52 +00:00
|
|
|
// Ensure we have image info
|
|
|
|
if retrySoon, err := d.ensureImages(d.apiObject); err != nil {
|
|
|
|
hasError = true
|
2018-03-23 13:35:58 +00:00
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("Image detection failed", err, d.apiObject))
|
2018-03-20 12:10:52 +00:00
|
|
|
} else if retrySoon {
|
|
|
|
nextInterval = minInspectionInterval
|
|
|
|
}
|
|
|
|
|
2018-03-15 15:33:28 +00:00
|
|
|
// Inspection of generated resources needed
|
2018-05-11 08:07:00 +00:00
|
|
|
if err := d.resources.InspectPods(ctx); err != nil {
|
2018-03-15 15:33:28 +00:00
|
|
|
hasError = true
|
2018-03-23 13:35:58 +00:00
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("Pod inspection failed", err, d.apiObject))
|
2018-03-15 15:33:28 +00:00
|
|
|
}
|
2018-05-11 14:56:20 +00:00
|
|
|
if err := d.resources.InspectPVCs(ctx); err != nil {
|
|
|
|
hasError = true
|
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("PVC inspection failed", err, d.apiObject))
|
|
|
|
}
|
2018-03-15 15:33:28 +00:00
|
|
|
|
2018-03-29 09:56:57 +00:00
|
|
|
// Check members for resilience
|
|
|
|
if err := d.resilience.CheckMemberFailure(); err != nil {
|
|
|
|
hasError = true
|
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("Member failure detection failed", err, d.apiObject))
|
|
|
|
}
|
|
|
|
|
2018-03-15 15:33:28 +00:00
|
|
|
// Create scale/update plan
|
2018-03-23 11:15:22 +00:00
|
|
|
if err := d.reconciler.CreatePlan(); err != nil {
|
2018-03-15 15:33:28 +00:00
|
|
|
hasError = true
|
2018-03-23 13:35:58 +00:00
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("Plan creation failed", err, d.apiObject))
|
2018-03-15 15:33:28 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Execute current step of scale/update plan
|
2018-03-23 11:15:22 +00:00
|
|
|
retrySoon, err := d.reconciler.ExecutePlan(ctx)
|
2018-03-15 15:33:28 +00:00
|
|
|
if err != nil {
|
|
|
|
hasError = true
|
2018-03-23 13:35:58 +00:00
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("Plan execution failed", err, d.apiObject))
|
2018-03-15 15:33:28 +00:00
|
|
|
}
|
|
|
|
if retrySoon {
|
|
|
|
nextInterval = minInspectionInterval
|
|
|
|
}
|
|
|
|
|
|
|
|
// Ensure all resources are created
|
2018-05-08 09:34:16 +00:00
|
|
|
if err := d.resources.EnsureSecrets(); err != nil {
|
|
|
|
hasError = true
|
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("Secret creation failed", err, d.apiObject))
|
|
|
|
}
|
2018-03-23 14:01:56 +00:00
|
|
|
if err := d.resources.EnsureServices(); err != nil {
|
|
|
|
hasError = true
|
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("Service creation failed", err, d.apiObject))
|
|
|
|
}
|
|
|
|
if err := d.resources.EnsurePVCs(); err != nil {
|
2018-03-15 15:33:28 +00:00
|
|
|
hasError = true
|
2018-03-23 13:35:58 +00:00
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("PVC creation failed", err, d.apiObject))
|
2018-03-15 15:33:28 +00:00
|
|
|
}
|
2018-03-23 13:35:58 +00:00
|
|
|
if err := d.resources.EnsurePods(); err != nil {
|
2018-03-15 15:33:28 +00:00
|
|
|
hasError = true
|
2018-03-23 13:35:58 +00:00
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("Pod creation failed", err, d.apiObject))
|
2018-03-15 15:33:28 +00:00
|
|
|
}
|
|
|
|
|
2018-03-26 11:35:00 +00:00
|
|
|
// At the end of the inspect, we cleanup terminated pods.
|
|
|
|
if d.resources.CleanupTerminatedPods(); err != nil {
|
|
|
|
hasError = true
|
|
|
|
d.CreateEvent(k8sutil.NewErrorEvent("Pod cleanup failed", err, d.apiObject))
|
|
|
|
}
|
|
|
|
|
2018-03-15 15:33:28 +00:00
|
|
|
// Update next interval (on errors)
|
|
|
|
if hasError {
|
|
|
|
if d.recentInspectionErrors == 0 {
|
|
|
|
nextInterval = minInspectionInterval
|
|
|
|
d.recentInspectionErrors++
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
d.recentInspectionErrors = 0
|
|
|
|
}
|
|
|
|
if nextInterval > maxInspectionInterval {
|
|
|
|
nextInterval = maxInspectionInterval
|
|
|
|
}
|
|
|
|
return nextInterval
|
|
|
|
}
|
2018-03-23 14:36:10 +00:00
|
|
|
|
|
|
|
// triggerInspection ensures that an inspection is run soon.
|
|
|
|
func (d *Deployment) triggerInspection() {
|
|
|
|
d.inspectTrigger.Trigger()
|
|
|
|
}
|