|
|
|
|
@ -19,10 +19,10 @@ package controllers
|
|
|
|
|
import (
|
|
|
|
|
"context"
|
|
|
|
|
"reflect"
|
|
|
|
|
"sort"
|
|
|
|
|
"time"
|
|
|
|
|
|
|
|
|
|
appsv1 "k8s.io/api/apps/v1"
|
|
|
|
|
"k8s.io/apimachinery/pkg/api/errors"
|
|
|
|
|
"k8s.io/apimachinery/pkg/types"
|
|
|
|
|
|
|
|
|
|
"k8s.io/apimachinery/pkg/runtime"
|
|
|
|
|
@ -99,27 +99,15 @@ func (r *RunnerSetReconciler) Reconcile(ctx context.Context, req ctrl.Request) (
|
|
|
|
|
return ctrl.Result{}, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
liveStatefulSet := &appsv1.StatefulSet{}
|
|
|
|
|
if err := r.Get(ctx, types.NamespacedName{Namespace: runnerSet.Namespace, Name: runnerSet.Name}, liveStatefulSet); err != nil {
|
|
|
|
|
if !errors.IsNotFound(err) {
|
|
|
|
|
log.Error(err, "Failed to get live statefulset")
|
|
|
|
|
|
|
|
|
|
var statefulsetList appsv1.StatefulSetList
|
|
|
|
|
if err := r.List(ctx, &statefulsetList, client.InNamespace(req.Namespace), client.MatchingFields{runnerSetOwnerKey: req.Name}); err != nil {
|
|
|
|
|
return ctrl.Result{}, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if err := r.Client.Create(ctx, desiredStatefulSet); err != nil {
|
|
|
|
|
log.Error(err, "Failed to create statefulset resource")
|
|
|
|
|
|
|
|
|
|
return ctrl.Result{}, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return ctrl.Result{}, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
liveTemplateHash, ok := getStatefulSetTemplateHash(liveStatefulSet)
|
|
|
|
|
if !ok {
|
|
|
|
|
log.Info("Failed to get template hash of newest statefulset resource. It must be in an invalid state. Please manually delete the statefulset so that it is recreated")
|
|
|
|
|
statefulsets := statefulsetList.Items
|
|
|
|
|
|
|
|
|
|
if len(statefulsets) > 1000 {
|
|
|
|
|
log.Info("Postponed reconcilation to prevent potential infinite loop. If you're really scaling more than 1000 statefulsets, do change this hard-coded threshold!")
|
|
|
|
|
return ctrl.Result{}, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@ -130,15 +118,21 @@ func (r *RunnerSetReconciler) Reconcile(ctx context.Context, req ctrl.Request) (
|
|
|
|
|
return ctrl.Result{}, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if liveTemplateHash != desiredTemplateHash {
|
|
|
|
|
copy := liveStatefulSet.DeepCopy()
|
|
|
|
|
copy.Spec = desiredStatefulSet.Spec
|
|
|
|
|
statefulsetsPerTemplateHash := map[string][]*podsForStatefulset{}
|
|
|
|
|
|
|
|
|
|
if err := r.Client.Patch(ctx, copy, client.MergeFrom(liveStatefulSet)); err != nil {
|
|
|
|
|
log.Error(err, "Failed to patch statefulset", "reason", errors.ReasonForError(err))
|
|
|
|
|
|
|
|
|
|
if errors.IsInvalid(err) {
|
|
|
|
|
// NOTE: This might not be ideal but is currently required to deal with the forbidden error by recreating the statefulset
|
|
|
|
|
// # Why do we recreate statefulsets instead of updating their desired replicas?
|
|
|
|
|
//
|
|
|
|
|
// A statefulset cannot add more pods when not all the pods are running.
|
|
|
|
|
// Our ephemeral runners' pods that have finished running become Completed(Phase=Succeeded).
|
|
|
|
|
// So creating one statefulset per a batch of ephemeral runners is the only way for us to add more replicas.
|
|
|
|
|
//
|
|
|
|
|
// # Why do we recreate statefulsets instead of updating fields other than replicas?
|
|
|
|
|
//
|
|
|
|
|
// That's because Kubernetes doesn't allow updating anything other than replicas, template, and updateStrategy.
|
|
|
|
|
// And the nature of ephemeral runner pods requires you to create a statefulset per a batch of new runner pods so
|
|
|
|
|
// we have really no other choice.
|
|
|
|
|
//
|
|
|
|
|
// If you're curious, the below is the error message you will get when you tried to update forbidden StatefulSet field(s):
|
|
|
|
|
//
|
|
|
|
|
// 2021-06-13T07:19:52.760Z ERROR actions-runner-controller.runnerset Failed to patch statefulset
|
|
|
|
|
// {"runnerset": "default/example-runnerset", "error": "StatefulSet.apps \"example-runnerset\" is invalid: s
|
|
|
|
|
@ -146,60 +140,173 @@ func (r *RunnerSetReconciler) Reconcile(ctx context.Context, req ctrl.Request) (
|
|
|
|
|
// are forbidden"}
|
|
|
|
|
//
|
|
|
|
|
// Even though the error message includes "Forbidden", this error's reason is "Invalid".
|
|
|
|
|
// That's why we're using errors.IsInvalid above.
|
|
|
|
|
// So we used to match these errors by using errors.IsInvalid. But that's another story...
|
|
|
|
|
|
|
|
|
|
if err := r.Client.Delete(ctx, liveStatefulSet); err != nil {
|
|
|
|
|
log.Error(err, "Failed to delete statefulset for force-update")
|
|
|
|
|
return ctrl.Result{}, err
|
|
|
|
|
}
|
|
|
|
|
log.Info("Deleted statefulset for force-update")
|
|
|
|
|
}
|
|
|
|
|
var lastSyncTime *time.Time
|
|
|
|
|
|
|
|
|
|
for _, ss := range statefulsets {
|
|
|
|
|
ss := ss
|
|
|
|
|
|
|
|
|
|
log := log.WithValues("statefulset", types.NamespacedName{Namespace: ss.Namespace, Name: ss.Name})
|
|
|
|
|
|
|
|
|
|
res, err := r.getPodsForStatefulset(ctx, log, &ss)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return ctrl.Result{}, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// We requeue in order to clean up old runner replica sets later.
|
|
|
|
|
// Otherwise, they aren't cleaned up until the next re-sync interval.
|
|
|
|
|
return ctrl.Result{RequeueAfter: 5 * time.Second}, nil
|
|
|
|
|
if !res.statefulset.DeletionTimestamp.IsZero() {
|
|
|
|
|
continue
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if res.statefulset.Annotations != nil {
|
|
|
|
|
if a, ok := res.statefulset.Annotations[SyncTimeAnnotationKey]; ok {
|
|
|
|
|
t, err := time.Parse(time.RFC3339, a)
|
|
|
|
|
if err == nil {
|
|
|
|
|
if lastSyncTime == nil || lastSyncTime.Before(t) {
|
|
|
|
|
lastSyncTime = &t
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
statefulsetsPerTemplateHash[res.templateHash] = append(statefulsetsPerTemplateHash[res.templateHash], res)
|
|
|
|
|
|
|
|
|
|
if res.total > 0 && res.total == res.completed {
|
|
|
|
|
if err := r.Client.Delete(ctx, &ss); err != nil {
|
|
|
|
|
log.Error(err, "Unable to delete statefulset")
|
|
|
|
|
return ctrl.Result{}, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
log.V(2).Info("Deleted completed statefulset")
|
|
|
|
|
|
|
|
|
|
return ctrl.Result{}, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
var replicas int32 = 1
|
|
|
|
|
if ss.Spec.Replicas != nil {
|
|
|
|
|
replicas = *ss.Spec.Replicas
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ss.Status.Replicas != replicas {
|
|
|
|
|
log.V(2).Info("Waiting for statefulset to sync", "desiredReplicas", replicas, "currentReplicas", ss.Status.Replicas)
|
|
|
|
|
return ctrl.Result{}, nil
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
currentStatefulSets := statefulsetsPerTemplateHash[desiredTemplateHash]
|
|
|
|
|
|
|
|
|
|
sort.SliceStable(currentStatefulSets, func(i, j int) bool {
|
|
|
|
|
return currentStatefulSets[i].statefulset.CreationTimestamp.Before(¤tStatefulSets[j].statefulset.CreationTimestamp)
|
|
|
|
|
})
|
|
|
|
|
|
|
|
|
|
if len(currentStatefulSets) > 0 {
|
|
|
|
|
timestampFirst := currentStatefulSets[0].statefulset.CreationTimestamp
|
|
|
|
|
timestampLast := currentStatefulSets[len(currentStatefulSets)-1].statefulset.CreationTimestamp
|
|
|
|
|
var names []string
|
|
|
|
|
for _, ss := range currentStatefulSets {
|
|
|
|
|
names = append(names, ss.statefulset.Name)
|
|
|
|
|
}
|
|
|
|
|
log.V(2).Info("Detected some current statefulsets", "creationTimestampFirst", timestampFirst, "creationTimestampLast", timestampLast, "statefulsets", names)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
var pending, running int
|
|
|
|
|
|
|
|
|
|
for _, ss := range currentStatefulSets {
|
|
|
|
|
pending += ss.pending
|
|
|
|
|
running += ss.running
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
const defaultReplicas = 1
|
|
|
|
|
|
|
|
|
|
var replicasOfLiveStatefulSet *int
|
|
|
|
|
if liveStatefulSet.Spec.Replicas != nil {
|
|
|
|
|
v := int(*liveStatefulSet.Spec.Replicas)
|
|
|
|
|
replicasOfLiveStatefulSet = &v
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
var replicasOfDesiredStatefulSet *int
|
|
|
|
|
if desiredStatefulSet.Spec.Replicas != nil {
|
|
|
|
|
v := int(*desiredStatefulSet.Spec.Replicas)
|
|
|
|
|
replicasOfDesiredStatefulSet = &v
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
currentDesiredReplicas := getIntOrDefault(replicasOfLiveStatefulSet, defaultReplicas)
|
|
|
|
|
newDesiredReplicas := getIntOrDefault(replicasOfDesiredStatefulSet, defaultReplicas)
|
|
|
|
|
|
|
|
|
|
// Please add more conditions that we can in-place update the newest runnerreplicaset without disruption
|
|
|
|
|
if currentDesiredReplicas != newDesiredReplicas {
|
|
|
|
|
v := int32(newDesiredReplicas)
|
|
|
|
|
log.V(2).Info("Found some pods across statefulset(s)", "pending", pending, "running", running, "desired", newDesiredReplicas, "statefulsets", len(statefulsets))
|
|
|
|
|
|
|
|
|
|
updated := liveStatefulSet.DeepCopy()
|
|
|
|
|
updated.Spec.Replicas = &v
|
|
|
|
|
effectiveTime := runnerSet.Spec.EffectiveTime
|
|
|
|
|
ephemeral := runnerSet.Spec.Ephemeral == nil || *runnerSet.Spec.Ephemeral
|
|
|
|
|
|
|
|
|
|
if err := r.Client.Patch(ctx, updated, client.MergeFrom(liveStatefulSet)); err != nil {
|
|
|
|
|
log.Error(err, "Failed to update statefulset")
|
|
|
|
|
if newDesiredReplicas > pending+running && ephemeral && lastSyncTime != nil && effectiveTime != nil && lastSyncTime.After(effectiveTime.Time) {
|
|
|
|
|
log.V(2).Info("Detected that some ephemeral runners have disappeared. Usually this is due to that ephemeral runner completions so ARC does not create new runners until EffectiveTime is updated.", "lastSyncTime", metav1.Time{Time: *lastSyncTime}, "effectiveTime", *effectiveTime, "desired", newDesiredReplicas, "pending", pending, "running", running)
|
|
|
|
|
} else if newDesiredReplicas > pending+running {
|
|
|
|
|
num := newDesiredReplicas - (pending + running)
|
|
|
|
|
|
|
|
|
|
for i := 0; i < num; i++ {
|
|
|
|
|
// Add more replicas
|
|
|
|
|
addedReplicas := int32(1)
|
|
|
|
|
|
|
|
|
|
create := desiredStatefulSet.DeepCopy()
|
|
|
|
|
create.Spec.Replicas = &addedReplicas
|
|
|
|
|
if err := r.Client.Create(ctx, create); err != nil {
|
|
|
|
|
return ctrl.Result{}, err
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
log.V(2).Info("Created statefulset(s) to add more replicas", "num", num)
|
|
|
|
|
|
|
|
|
|
return ctrl.Result{}, nil
|
|
|
|
|
} else if newDesiredReplicas < running {
|
|
|
|
|
var retained int
|
|
|
|
|
var lastIndex int
|
|
|
|
|
for i := len(currentStatefulSets) - 1; i >= 0; i-- {
|
|
|
|
|
ss := currentStatefulSets[i]
|
|
|
|
|
retained += ss.running
|
|
|
|
|
if retained >= newDesiredReplicas {
|
|
|
|
|
lastIndex = i
|
|
|
|
|
break
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if retained == newDesiredReplicas {
|
|
|
|
|
for i := 0; i < lastIndex; i++ {
|
|
|
|
|
ss := currentStatefulSets[i]
|
|
|
|
|
log := log.WithValues("statefulset", types.NamespacedName{Namespace: ss.statefulset.Namespace, Name: ss.statefulset.Name})
|
|
|
|
|
if err := r.Client.Delete(ctx, ss.statefulset); err != nil {
|
|
|
|
|
return ctrl.Result{}, err
|
|
|
|
|
}
|
|
|
|
|
log.V(2).Info("Deleted redundant statefulset", "i", i, "lastIndex", lastIndex)
|
|
|
|
|
}
|
|
|
|
|
return ctrl.Result{}, err
|
|
|
|
|
} else if retained > newDesiredReplicas {
|
|
|
|
|
log.V(2).Info("Waiting sync before scale down", "retained", retained, "newDesiredReplicas", newDesiredReplicas, "lastIndex", lastIndex)
|
|
|
|
|
|
|
|
|
|
return ctrl.Result{}, nil
|
|
|
|
|
} else {
|
|
|
|
|
log.Info("Invalid state", "retained", retained, "newDesiredReplicas", newDesiredReplicas, "lastIndex", lastIndex)
|
|
|
|
|
panic("crashed due to invalid state")
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
for _, sss := range statefulsetsPerTemplateHash {
|
|
|
|
|
for _, ss := range sss {
|
|
|
|
|
if ss.templateHash != desiredTemplateHash {
|
|
|
|
|
if ss.statefulset.DeletionTimestamp.IsZero() {
|
|
|
|
|
if err := r.Client.Delete(ctx, ss.statefulset); err != nil {
|
|
|
|
|
log.Error(err, "Unable to delete statefulset")
|
|
|
|
|
return ctrl.Result{}, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
log.V(2).Info("Deleted redundant and outdated statefulset")
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return ctrl.Result{}, nil
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
statusReplicas := int(liveStatefulSet.Status.Replicas)
|
|
|
|
|
statusReadyReplicas := int(liveStatefulSet.Status.ReadyReplicas)
|
|
|
|
|
totalCurrentReplicas := int(liveStatefulSet.Status.CurrentReplicas)
|
|
|
|
|
updatedReplicas := int(liveStatefulSet.Status.UpdatedReplicas)
|
|
|
|
|
var statusReplicas, statusReadyReplicas, totalCurrentReplicas, updatedReplicas int
|
|
|
|
|
|
|
|
|
|
for _, ss := range currentStatefulSets {
|
|
|
|
|
statusReplicas += int(ss.statefulset.Status.Replicas)
|
|
|
|
|
statusReadyReplicas += int(ss.statefulset.Status.ReadyReplicas)
|
|
|
|
|
totalCurrentReplicas += int(ss.statefulset.Status.CurrentReplicas)
|
|
|
|
|
updatedReplicas += int(ss.statefulset.Status.UpdatedReplicas)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
status := runnerSet.Status.DeepCopy()
|
|
|
|
|
|
|
|
|
|
@ -224,6 +331,64 @@ func (r *RunnerSetReconciler) Reconcile(ctx context.Context, req ctrl.Request) (
|
|
|
|
|
return ctrl.Result{}, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
type podsForStatefulset struct {
|
|
|
|
|
total int
|
|
|
|
|
completed int
|
|
|
|
|
running int
|
|
|
|
|
terminating int
|
|
|
|
|
pending int
|
|
|
|
|
templateHash string
|
|
|
|
|
statefulset *appsv1.StatefulSet
|
|
|
|
|
pods []corev1.Pod
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
func (r *RunnerSetReconciler) getPodsForStatefulset(ctx context.Context, log logr.Logger, ss *appsv1.StatefulSet) (*podsForStatefulset, error) {
|
|
|
|
|
var podList corev1.PodList
|
|
|
|
|
|
|
|
|
|
if err := r.Client.List(ctx, &podList, client.MatchingLabels(ss.Spec.Template.ObjectMeta.Labels)); err != nil {
|
|
|
|
|
log.Error(err, "Failed to list pods managed by statefulset")
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
var completed, running, terminating, pending, total int
|
|
|
|
|
|
|
|
|
|
for _, pod := range podList.Items {
|
|
|
|
|
if owner := metav1.GetControllerOf(&pod); owner == nil || owner.Kind != "StatefulSet" || owner.Name != ss.Name {
|
|
|
|
|
continue
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
total++
|
|
|
|
|
|
|
|
|
|
if runnerPodOrContainerIsStopped(&pod) {
|
|
|
|
|
completed++
|
|
|
|
|
} else if pod.Status.Phase == corev1.PodRunning {
|
|
|
|
|
running++
|
|
|
|
|
} else if !pod.DeletionTimestamp.IsZero() {
|
|
|
|
|
terminating++
|
|
|
|
|
} else {
|
|
|
|
|
pending++
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
templateHash, ok := getStatefulSetTemplateHash(ss)
|
|
|
|
|
if !ok {
|
|
|
|
|
log.Info("Failed to get template hash of statefulset. It must be in an invalid state. Please manually delete the statefulset so that it is recreated")
|
|
|
|
|
|
|
|
|
|
return nil, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return &podsForStatefulset{
|
|
|
|
|
total: total,
|
|
|
|
|
completed: completed,
|
|
|
|
|
running: running,
|
|
|
|
|
terminating: terminating,
|
|
|
|
|
pending: pending,
|
|
|
|
|
templateHash: templateHash,
|
|
|
|
|
statefulset: ss,
|
|
|
|
|
pods: podList.Items,
|
|
|
|
|
}, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
func getStatefulSetTemplateHash(rs *appsv1.StatefulSet) (string, bool) {
|
|
|
|
|
hash, ok := rs.Labels[LabelKeyRunnerTemplateHash]
|
|
|
|
|
|
|
|
|
|
@ -288,9 +453,12 @@ func (r *RunnerSetReconciler) newStatefulSet(runnerSet *v1alpha1.RunnerSet) (*ap
|
|
|
|
|
rs := appsv1.StatefulSet{
|
|
|
|
|
TypeMeta: metav1.TypeMeta{},
|
|
|
|
|
ObjectMeta: metav1.ObjectMeta{
|
|
|
|
|
Name: runnerSet.ObjectMeta.Name,
|
|
|
|
|
GenerateName: runnerSet.ObjectMeta.Name + "-",
|
|
|
|
|
Namespace: runnerSet.ObjectMeta.Namespace,
|
|
|
|
|
Labels: CloneAndAddLabel(runnerSet.ObjectMeta.Labels, LabelKeyRunnerTemplateHash, templateHash),
|
|
|
|
|
Annotations: map[string]string{
|
|
|
|
|
SyncTimeAnnotationKey: time.Now().Format(time.RFC3339),
|
|
|
|
|
},
|
|
|
|
|
},
|
|
|
|
|
Spec: runnerSetWithOverrides.StatefulSetSpec,
|
|
|
|
|
}
|
|
|
|
|
@ -310,6 +478,22 @@ func (r *RunnerSetReconciler) SetupWithManager(mgr ctrl.Manager) error {
|
|
|
|
|
|
|
|
|
|
r.Recorder = mgr.GetEventRecorderFor(name)
|
|
|
|
|
|
|
|
|
|
if err := mgr.GetFieldIndexer().IndexField(context.TODO(), &appsv1.StatefulSet{}, runnerSetOwnerKey, func(rawObj client.Object) []string {
|
|
|
|
|
set := rawObj.(*appsv1.StatefulSet)
|
|
|
|
|
owner := metav1.GetControllerOf(set)
|
|
|
|
|
if owner == nil {
|
|
|
|
|
return nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if owner.APIVersion != v1alpha1.GroupVersion.String() || owner.Kind != "RunnerSet" {
|
|
|
|
|
return nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return []string{owner.Name}
|
|
|
|
|
}); err != nil {
|
|
|
|
|
return err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return ctrl.NewControllerManagedBy(mgr).
|
|
|
|
|
For(&v1alpha1.RunnerSet{}).
|
|
|
|
|
Owns(&appsv1.StatefulSet{}).
|
|
|
|
|
|