Skip to content

Commit

Permalink
MS: improve replica defaulting for autoscaler
Browse files Browse the repository at this point in the history
  • Loading branch information
aiden-von committed Nov 21, 2023
1 parent 0eb51f0 commit addb065
Show file tree
Hide file tree
Showing 11 changed files with 368 additions and 39 deletions.
17 changes: 15 additions & 2 deletions api/v1beta1/machineset_types.go
Original file line number Diff line number Diff line change
Expand Up @@ -41,9 +41,22 @@ type MachineSetSpec struct {

// Replicas is the number of desired replicas.
// This is a pointer to distinguish between explicit zero and unspecified.
// Defaults to 1.
//
// Defaults to:
// * if the Kubernetes autoscaler min size and max size annotations are set:
// - if it's a new MachineSet, use min size
// - if the replicas field of the old MachineSet is < min size, use min size
// - if the replicas field of the old MachineSet is > max size, use max size
// - if the replicas field of the old MachineSet is in the (min size, max size) range, keep the value from the oldMS
// * otherwise use 1
// Note: Defaulting will be run whenever the replicas field is not set:
// * A new MachineSet is created with replicas not set.
// * On an existing MachineSet the replicas field was first set and is now unset.
// Those cases are especially relevant for the following Kubernetes autoscaler use cases:
// * A new MachineSet is created and replicas should be managed by the autoscaler
// * An existing MachineSet which initially wasn't controlled by the autoscaler
// should be later controlled by the autoscaler
// +optional
// +kubebuilder:default=1
Replicas *int32 `json:"replicas,omitempty"`

// MinReadySeconds is the minimum number of seconds for which a Node for a newly created machine should be ready before considering the replica available.
Expand Down
2 changes: 1 addition & 1 deletion api/v1beta1/zz_generated.openapi.go

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

20 changes: 16 additions & 4 deletions config/crd/bases/cluster.x-k8s.io_machinesets.yaml

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

14 changes: 7 additions & 7 deletions docs/book/src/tasks/automated-machine-management/autoscaling.md
Original file line number Diff line number Diff line change
Expand Up @@ -12,17 +12,17 @@ from the [Autoscaler project documentation](https://github.com/kubernetes/autosc

<aside class="note warning">

<h1>Defaulting of the MachineDeployment replicas field</h1>
<h1>Defaulting of the MachineDeployment, MachineSet replicas field</h1>

Please note that the MachineDeployment replicas field has special defaulting logic to provide a smooth integration with the autoscaler.
The replica field is defaulted based on the autoscaler min and max size annotations.The goal is to pick a default value which is inside
Please note that the MachineDeployment and MachineSet replicas field has special defaulting logic to provide a smooth integration with the autoscaler.
The replica field is defaulted based on the autoscaler min and max size annotations.The goal is to pick a default value which is inside
the (min size, max size) range so the autoscaler can take control of the replicase field.

The defaulting logic is as follows:
* if the autoscaler min size and max size annotations are set:
* if it's a new MachineDeployment, use min size
* if the replicas field of the old MachineDeployment is < min size, use min size
* if the replicas field of the old MachineDeployment is > max size, use max size
* if the replicas field of the old MachineDeployment is in the (min size, max size) range, keep the value from the oldMD
* if it's a new MachineDeployment or MachineSet, use min size
* if the replicas field of the old MachineDeployment or MachineSet is < min size, use min size
* if the replicas field of the old MachineDeployment or MachineSet is > max size, use max size
* if the replicas field of the old MachineDeployment or MachineSet is in the (min size, max size) range, keep the value from the oldMD or oldMS
* otherwise, use 1
</aside>
Original file line number Diff line number Diff line change
Expand Up @@ -40,6 +40,7 @@ import (
"sigs.k8s.io/controller-runtime/pkg/client/fake"
"sigs.k8s.io/controller-runtime/pkg/log"
"sigs.k8s.io/controller-runtime/pkg/reconcile"
"sigs.k8s.io/controller-runtime/pkg/webhook/admission"

clusterv1 "sigs.k8s.io/cluster-api/api/v1beta1"
"sigs.k8s.io/cluster-api/api/v1beta1/index"
Expand Down Expand Up @@ -1249,7 +1250,9 @@ func TestMachineHealthCheck_Reconcile(t *testing.T) {
},
},
}
g.Expect((&webhooks.MachineSet{}).Default(ctx, machineSet)).Should(Succeed())

reqCtx := admission.NewContextWithRequest(ctx, admission.Request{})
g.Expect((&webhooks.MachineSet{}).Default(reqCtx, machineSet)).Should(Succeed())
g.Expect(env.Create(ctx, machineSet)).To(Succeed())

// Ensure machines have been created.
Expand Down
5 changes: 2 additions & 3 deletions internal/controllers/topology/cluster/reconcile_state_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -3241,9 +3241,8 @@ func newFakeMachineDeploymentTopologyState(name string, infrastructureMachineTem

scheme := runtime.NewScheme()
_ = clusterv1.AddToScheme(scheme)
if err := (&webhooks.MachineDeployment{
Decoder: admission.NewDecoder(scheme),
}).Default(admission.NewContextWithRequest(ctx, admission.Request{}), mdState.Object); err != nil {
if err := (&webhooks.MachineDeployment{}).
Default(admission.NewContextWithRequest(ctx, admission.Request{}), mdState.Object); err != nil {
panic(err)
}
return mdState
Expand Down
8 changes: 4 additions & 4 deletions internal/webhooks/machinedeployment.go
Original file line number Diff line number Diff line change
Expand Up @@ -42,8 +42,8 @@ import (
)

func (webhook *MachineDeployment) SetupWebhookWithManager(mgr ctrl.Manager) error {
if webhook.Decoder == nil {
webhook.Decoder = admission.NewDecoder(mgr.GetScheme())
if webhook.decoder == nil {
webhook.decoder = admission.NewDecoder(mgr.GetScheme())
}

return ctrl.NewWebhookManagedBy(mgr).
Expand All @@ -58,7 +58,7 @@ func (webhook *MachineDeployment) SetupWebhookWithManager(mgr ctrl.Manager) erro

// MachineDeployment implements a validation and defaulting webhook for MachineDeployment.
type MachineDeployment struct {
Decoder *admission.Decoder
decoder *admission.Decoder
}

var _ webhook.CustomDefaulter = &MachineDeployment{}
Expand All @@ -83,7 +83,7 @@ func (webhook *MachineDeployment) Default(ctx context.Context, obj runtime.Objec
var oldMD *clusterv1.MachineDeployment
if req.Operation == v1.Update {
oldMD = &clusterv1.MachineDeployment{}
if err := webhook.Decoder.DecodeRaw(req.OldObject, oldMD); err != nil {
if err := webhook.decoder.DecodeRaw(req.OldObject, oldMD); err != nil {
return errors.Wrapf(err, "failed to decode oldObject to MachineDeployment")
}
}
Expand Down
10 changes: 5 additions & 5 deletions internal/webhooks/machinedeployment_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -52,7 +52,7 @@ func TestMachineDeploymentDefault(t *testing.T) {
scheme := runtime.NewScheme()
g.Expect(clusterv1.AddToScheme(scheme)).To(Succeed())
webhook := &MachineDeployment{
Decoder: admission.NewDecoder(scheme),
decoder: admission.NewDecoder(scheme),
}

reqCtx := admission.NewContextWithRequest(ctx, admission.Request{
Expand Down Expand Up @@ -403,7 +403,7 @@ func TestMachineDeploymentValidation(t *testing.T) {
scheme := runtime.NewScheme()
g.Expect(clusterv1.AddToScheme(scheme)).To(Succeed())
webhook := MachineDeployment{
Decoder: admission.NewDecoder(scheme),
decoder: admission.NewDecoder(scheme),
}

if tt.expectErr {
Expand Down Expand Up @@ -475,7 +475,7 @@ func TestMachineDeploymentVersionValidation(t *testing.T) {
scheme := runtime.NewScheme()
g.Expect(clusterv1.AddToScheme(scheme)).To(Succeed())
webhook := MachineDeployment{
Decoder: admission.NewDecoder(scheme),
decoder: admission.NewDecoder(scheme),
}

if tt.expectErr {
Expand Down Expand Up @@ -537,7 +537,7 @@ func TestMachineDeploymentClusterNameImmutable(t *testing.T) {
scheme := runtime.NewScheme()
g.Expect(clusterv1.AddToScheme(scheme)).To(Succeed())
webhook := MachineDeployment{
Decoder: admission.NewDecoder(scheme),
decoder: admission.NewDecoder(scheme),
}

warnings, err := webhook.ValidateUpdate(ctx, oldMD, newMD)
Expand Down Expand Up @@ -589,7 +589,7 @@ func TestMachineDeploymentTemplateMetadataValidation(t *testing.T) {
scheme := runtime.NewScheme()
g.Expect(clusterv1.AddToScheme(scheme)).To(Succeed())
webhook := MachineDeployment{
Decoder: admission.NewDecoder(scheme),
decoder: admission.NewDecoder(scheme),
}

if tt.expectErr {
Expand Down
139 changes: 137 additions & 2 deletions internal/webhooks/machineset.go
Original file line number Diff line number Diff line change
Expand Up @@ -19,14 +19,18 @@ package webhooks
import (
"context"
"fmt"
"strconv"
"strings"

"github.com/pkg/errors"
v1 "k8s.io/api/admission/v1"
apierrors "k8s.io/apimachinery/pkg/api/errors"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
"k8s.io/apimachinery/pkg/labels"
"k8s.io/apimachinery/pkg/runtime"
"k8s.io/apimachinery/pkg/util/sets"
"k8s.io/apimachinery/pkg/util/validation/field"
"k8s.io/utils/pointer"
ctrl "sigs.k8s.io/controller-runtime"
"sigs.k8s.io/controller-runtime/pkg/client"
"sigs.k8s.io/controller-runtime/pkg/webhook"
Expand All @@ -39,6 +43,10 @@ import (
)

func (webhook *MachineSet) SetupWebhookWithManager(mgr ctrl.Manager) error {
if webhook.decoder == nil {
webhook.decoder = admission.NewDecoder(mgr.GetScheme())
}

return ctrl.NewWebhookManagedBy(mgr).
For(&clusterv1.MachineSet{}).
WithDefaulter(webhook).
Expand All @@ -50,23 +58,49 @@ func (webhook *MachineSet) SetupWebhookWithManager(mgr ctrl.Manager) error {
// +kubebuilder:webhook:verbs=create;update,path=/mutate-cluster-x-k8s-io-v1beta1-machineset,mutating=true,failurePolicy=fail,matchPolicy=Equivalent,groups=cluster.x-k8s.io,resources=machinesets,versions=v1beta1,name=default.machineset.cluster.x-k8s.io,sideEffects=None,admissionReviewVersions=v1;v1beta1

// MachineSet implements a validation and defaulting webhook for MachineSet.
type MachineSet struct{}
type MachineSet struct {
decoder *admission.Decoder
}

var _ webhook.CustomDefaulter = &MachineSet{}
var _ webhook.CustomValidator = &MachineSet{}

// Default sets default MachineSet field values.
func (webhook *MachineSet) Default(_ context.Context, obj runtime.Object) error {
func (webhook *MachineSet) Default(ctx context.Context, obj runtime.Object) error {
m, ok := obj.(*clusterv1.MachineSet)
if !ok {
return apierrors.NewBadRequest(fmt.Sprintf("expected a MachineSet but got a %T", obj))
}

req, err := admission.RequestFromContext(ctx)
if err != nil {
return err
}

dryRun := false
if req.DryRun != nil {
dryRun = *req.DryRun
}

var oldMS *clusterv1.MachineSet
if req.Operation == v1.Update {
oldMS = &clusterv1.MachineSet{}
if err := webhook.decoder.DecodeRaw(req.OldObject, oldMS); err != nil {
return errors.Wrapf(err, "failed to decode oldObject to MachineSet")
}
}

if m.Labels == nil {
m.Labels = make(map[string]string)
}
m.Labels[clusterv1.ClusterNameLabel] = m.Spec.ClusterName

replicas, err := calculateMachineSetReplicas(ctx, oldMS, m, dryRun)
if err != nil {
return err
}
m.Spec.Replicas = pointer.Int32(replicas)

if m.Spec.DeletePolicy == "" {
randomPolicy := string(clusterv1.RandomMachineSetDeletePolicy)
m.Spec.DeletePolicy = randomPolicy
Expand Down Expand Up @@ -219,3 +253,104 @@ func validateSkippedMachineSetPreflightChecks(o client.Object) *field.Error {
}
return nil
}

// calculateMachineSetReplicas calculates the default value of the replicas field.
// The value will be calculated based on the following logic:
// * if replicas is already set on newMS, keep the current value
// * if the autoscaler min size and max size annotations are set:
// - if it's a new MachineSet, use min size
// - if the replicas field of the old MachineSet is < min size, use min size
// - if the replicas field of the old MachineSet is > max size, use max size
// - if the replicas field of the old MachineSet is in the (min size, max size) range, keep the value from the oldMS
//
// * otherwise use 1
//
// The goal of this logic is to provide a smoother UX for clusters using the Kubernetes autoscaler.
// Note: Autoscaler only takes over control of the replicas field if the replicas value is in the (min size, max size) range.
//
// We are supporting the following use cases:
// * A new MS is created and replicas should be managed by the autoscaler
// - Either via the default annotation or via the min size and max size annotations the replicas field
// is defaulted to a value which is within the (min size, max size) range so the autoscaler can take control.
//
// * An existing MS which initially wasn't controlled by the autoscaler should be later controlled by the autoscaler
// - To adopt an existing MS users can use the default, min size and max size annotations to enable the autoscaler
// and to ensure the replicas field is within the (min size, max size) range. Without the annotations handing over
// control to the autoscaler by unsetting the replicas field would lead to the field being set to 1. This is very
// disruptive for existing Machines and if 1 is outside the (min size, max size) range the autoscaler won't take
// control.
//
// Notes:
// - While the min size and max size annotations of the autoscaler provide the best UX, other autoscalers can use the
// DefaultReplicasAnnotation if they have similar use cases.
func calculateMachineSetReplicas(ctx context.Context, oldMS *clusterv1.MachineSet, newMS *clusterv1.MachineSet, dryRun bool) (int32, error) {
// If replicas is already set => Keep the current value.
if newMS.Spec.Replicas != nil {
return *newMS.Spec.Replicas, nil
}

log := ctrl.LoggerFrom(ctx)

// If both autoscaler annotations are set, use them to calculate the default value.
minSizeString, hasMinSizeAnnotation := newMS.Annotations[clusterv1.AutoscalerMinSizeAnnotation]
maxSizeString, hasMaxSizeAnnotation := newMS.Annotations[clusterv1.AutoscalerMaxSizeAnnotation]
if hasMinSizeAnnotation && hasMaxSizeAnnotation {
minSize, err := strconv.ParseInt(minSizeString, 10, 32)
if err != nil {
return 0, errors.Wrapf(err, "failed to caculate MachineSet replicas value: could not parse the value of the %q annotation", clusterv1.AutoscalerMinSizeAnnotation)
}
maxSize, err := strconv.ParseInt(maxSizeString, 10, 32)
if err != nil {
return 0, errors.Wrapf(err, "failed to caculate MachineSet replicas value: could not parse the value of the %q annotation", clusterv1.AutoscalerMaxSizeAnnotation)
}

// If it's a new MachineSet => Use the min size.
// Note: This will result in a scale up to get into the range where autoscaler takes over.
if oldMS == nil {
if !dryRun {
log.V(2).Info(fmt.Sprintf("Replica field has been defaulted to %d based on the %s annotation (MS is a new MS)", minSize, clusterv1.AutoscalerMinSizeAnnotation))
}
return int32(minSize), nil
}

// Otherwise we are handing over the control for the replicas field for an existing MachineSet
// to the autoscaler.

switch {
// If the old MachineSet doesn't have replicas set => Use the min size.
// Note: As defaulting always sets the replica field, this case should not be possible
// We only have this handling to be 100% safe against panics.
case oldMS.Spec.Replicas == nil:
if !dryRun {
log.V(2).Info(fmt.Sprintf("Replica field has been defaulted to %d based on the %s annotation (old MS didn't have replicas set)", minSize, clusterv1.AutoscalerMinSizeAnnotation))
}
return int32(minSize), nil
// If the old MachineSet replicas are lower than min size => Use the min size.
// Note: This will result in a scale up to get into the range where autoscaler takes over.
case *oldMS.Spec.Replicas < int32(minSize):
if !dryRun {
log.V(2).Info(fmt.Sprintf("Replica field has been defaulted to %d based on the %s annotation (old MS had replicas below min size)", minSize, clusterv1.AutoscalerMinSizeAnnotation))
}
return int32(minSize), nil
// If the old MachineSet replicas are higher than max size => Use the max size.
// Note: This will result in a scale down to get into the range where autoscaler takes over.
case *oldMS.Spec.Replicas > int32(maxSize):
if !dryRun {
log.V(2).Info(fmt.Sprintf("Replica field has been defaulted to %d based on the %s annotation (old MS had replicas above max size)", maxSize, clusterv1.AutoscalerMaxSizeAnnotation))
}
return int32(maxSize), nil
// If the old MachineSet replicas are between min and max size => Keep the current value.
default:
if !dryRun {
log.V(2).Info(fmt.Sprintf("Replica field has been defaulted to %d based on replicas of the old MachineSet (old MS had replicas within min size / max size range)", *oldMS.Spec.Replicas))
}
return *oldMS.Spec.Replicas, nil
}
}

// If neither the default nor the autoscaler annotations are set => Default to 1.
if !dryRun {
log.V(2).Info("Replica field has been defaulted to 1")
}
return 1, nil
}
Loading

0 comments on commit addb065

Please sign in to comment.