123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504 |
- /*
- Copyright 2014 The Kubernetes Authors.
- Licensed under the Apache License, Version 2.0 (the "License");
- you may not use this file except in compliance with the License.
- You may obtain a copy of the License at
- http://www.apache.org/licenses/LICENSE-2.0
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
- */
- package kubectl
- import (
- "fmt"
- "strconv"
- "time"
- "k8s.io/kubernetes/pkg/api"
- "k8s.io/kubernetes/pkg/api/errors"
- "k8s.io/kubernetes/pkg/api/unversioned"
- "k8s.io/kubernetes/pkg/apis/apps"
- "k8s.io/kubernetes/pkg/apis/batch"
- "k8s.io/kubernetes/pkg/apis/extensions"
- client "k8s.io/kubernetes/pkg/client/unversioned"
- "k8s.io/kubernetes/pkg/fields"
- "k8s.io/kubernetes/pkg/util/wait"
- "k8s.io/kubernetes/pkg/watch"
- )
- // Scaler provides an interface for resources that can be scaled.
- type Scaler interface {
- // Scale scales the named resource after checking preconditions. It optionally
- // retries in the event of resource version mismatch (if retry is not nil),
- // and optionally waits until the status of the resource matches newSize (if wait is not nil)
- Scale(namespace, name string, newSize uint, preconditions *ScalePrecondition, retry, wait *RetryParams) error
- // ScaleSimple does a simple one-shot attempt at scaling - not useful on its own, but
- // a necessary building block for Scale
- ScaleSimple(namespace, name string, preconditions *ScalePrecondition, newSize uint) (updatedResourceVersion string, err error)
- }
- func ScalerFor(kind unversioned.GroupKind, c client.Interface) (Scaler, error) {
- switch kind {
- case api.Kind("ReplicationController"):
- return &ReplicationControllerScaler{c}, nil
- case extensions.Kind("ReplicaSet"):
- return &ReplicaSetScaler{c.Extensions()}, nil
- case extensions.Kind("Job"), batch.Kind("Job"):
- return &JobScaler{c.Batch()}, nil // Either kind of job can be scaled with Batch interface.
- case apps.Kind("PetSet"):
- return &PetSetScaler{c.Apps()}, nil
- case extensions.Kind("Deployment"):
- return &DeploymentScaler{c.Extensions()}, nil
- }
- return nil, fmt.Errorf("no scaler has been implemented for %q", kind)
- }
- // ScalePrecondition describes a condition that must be true for the scale to take place
- // If CurrentSize == -1, it is ignored.
- // If CurrentResourceVersion is the empty string, it is ignored.
- // Otherwise they must equal the values in the resource for it to be valid.
- type ScalePrecondition struct {
- Size int
- ResourceVersion string
- }
- // A PreconditionError is returned when a resource fails to match
- // the scale preconditions passed to kubectl.
- type PreconditionError struct {
- Precondition string
- ExpectedValue string
- ActualValue string
- }
- func (pe PreconditionError) Error() string {
- return fmt.Sprintf("Expected %s to be %s, was %s", pe.Precondition, pe.ExpectedValue, pe.ActualValue)
- }
- type ScaleErrorType int
- const (
- ScaleGetFailure ScaleErrorType = iota
- ScaleUpdateFailure
- ScaleUpdateConflictFailure
- )
- // A ScaleError is returned when a scale request passes
- // preconditions but fails to actually scale the controller.
- type ScaleError struct {
- FailureType ScaleErrorType
- ResourceVersion string
- ActualError error
- }
- func (c ScaleError) Error() string {
- return fmt.Sprintf(
- "Scaling the resource failed with: %v; Current resource version %s",
- c.ActualError, c.ResourceVersion)
- }
- // RetryParams encapsulates the retry parameters used by kubectl's scaler.
- type RetryParams struct {
- Interval, Timeout time.Duration
- }
- func NewRetryParams(interval, timeout time.Duration) *RetryParams {
- return &RetryParams{interval, timeout}
- }
- // ScaleCondition is a closure around Scale that facilitates retries via util.wait
- func ScaleCondition(r Scaler, precondition *ScalePrecondition, namespace, name string, count uint, updatedResourceVersion *string) wait.ConditionFunc {
- return func() (bool, error) {
- rv, err := r.ScaleSimple(namespace, name, precondition, count)
- if updatedResourceVersion != nil {
- *updatedResourceVersion = rv
- }
- switch e, _ := err.(ScaleError); err.(type) {
- case nil:
- return true, nil
- case ScaleError:
- // Retry only on update conflicts.
- if e.FailureType == ScaleUpdateConflictFailure {
- return false, nil
- }
- }
- return false, err
- }
- }
- // ValidatePetSet ensures that the preconditions match. Returns nil if they are valid, an error otherwise.
- func (precondition *ScalePrecondition) ValidatePetSet(ps *apps.PetSet) error {
- if precondition.Size != -1 && int(ps.Spec.Replicas) != precondition.Size {
- return PreconditionError{"replicas", strconv.Itoa(precondition.Size), strconv.Itoa(int(ps.Spec.Replicas))}
- }
- if len(precondition.ResourceVersion) != 0 && ps.ResourceVersion != precondition.ResourceVersion {
- return PreconditionError{"resource version", precondition.ResourceVersion, ps.ResourceVersion}
- }
- return nil
- }
- // ValidateReplicationController ensures that the preconditions match. Returns nil if they are valid, an error otherwise
- func (precondition *ScalePrecondition) ValidateReplicationController(controller *api.ReplicationController) error {
- if precondition.Size != -1 && int(controller.Spec.Replicas) != precondition.Size {
- return PreconditionError{"replicas", strconv.Itoa(precondition.Size), strconv.Itoa(int(controller.Spec.Replicas))}
- }
- if len(precondition.ResourceVersion) != 0 && controller.ResourceVersion != precondition.ResourceVersion {
- return PreconditionError{"resource version", precondition.ResourceVersion, controller.ResourceVersion}
- }
- return nil
- }
- type ReplicationControllerScaler struct {
- c client.Interface
- }
- // ScaleSimple does a simple one-shot attempt at scaling. It returns the
- // resourceVersion of the replication controller if the update is successful.
- func (scaler *ReplicationControllerScaler) ScaleSimple(namespace, name string, preconditions *ScalePrecondition, newSize uint) (string, error) {
- controller, err := scaler.c.ReplicationControllers(namespace).Get(name)
- if err != nil {
- return "", ScaleError{ScaleGetFailure, "Unknown", err}
- }
- if preconditions != nil {
- if err := preconditions.ValidateReplicationController(controller); err != nil {
- return "", err
- }
- }
- controller.Spec.Replicas = int32(newSize)
- updatedRC, err := scaler.c.ReplicationControllers(namespace).Update(controller)
- if err != nil {
- if errors.IsConflict(err) {
- return "", ScaleError{ScaleUpdateConflictFailure, controller.ResourceVersion, err}
- }
- return "", ScaleError{ScaleUpdateFailure, controller.ResourceVersion, err}
- }
- return updatedRC.ObjectMeta.ResourceVersion, nil
- }
- // Scale updates a ReplicationController to a new size, with optional precondition check (if preconditions is not nil),
- // optional retries (if retry is not nil), and then optionally waits for it's replica count to reach the new value
- // (if wait is not nil).
- func (scaler *ReplicationControllerScaler) Scale(namespace, name string, newSize uint, preconditions *ScalePrecondition, retry, waitForReplicas *RetryParams) error {
- if preconditions == nil {
- preconditions = &ScalePrecondition{-1, ""}
- }
- if retry == nil {
- // Make it try only once, immediately
- retry = &RetryParams{Interval: time.Millisecond, Timeout: time.Millisecond}
- }
- var updatedResourceVersion string
- cond := ScaleCondition(scaler, preconditions, namespace, name, newSize, &updatedResourceVersion)
- if err := wait.PollImmediate(retry.Interval, retry.Timeout, cond); err != nil {
- return err
- }
- if waitForReplicas != nil {
- checkRC := func(rc *api.ReplicationController) bool {
- if uint(rc.Spec.Replicas) != newSize {
- // the size is changed by other party. Don't need to wait for the new change to complete.
- return true
- }
- return rc.Status.ObservedGeneration >= rc.Generation && rc.Status.Replicas == rc.Spec.Replicas
- }
- // If number of replicas doesn't change, then the update may not event
- // be sent to underlying databse (we don't send no-op changes).
- // In such case, <updatedResourceVersion> will have value of the most
- // recent update (which may be far in the past) so we may get "too old
- // RV" error from watch or potentially no ReplicationController events
- // will be deliver, since it may already be in the expected state.
- // To protect from these two, we first issue Get() to ensure that we
- // are not already in the expected state.
- currentRC, err := scaler.c.ReplicationControllers(namespace).Get(name)
- if err != nil {
- return err
- }
- if !checkRC(currentRC) {
- watchOptions := api.ListOptions{
- FieldSelector: fields.OneTermEqualSelector("metadata.name", name),
- ResourceVersion: updatedResourceVersion,
- }
- watcher, err := scaler.c.ReplicationControllers(namespace).Watch(watchOptions)
- if err != nil {
- return err
- }
- _, err = watch.Until(waitForReplicas.Timeout, watcher, func(event watch.Event) (bool, error) {
- if event.Type != watch.Added && event.Type != watch.Modified {
- return false, nil
- }
- return checkRC(event.Object.(*api.ReplicationController)), nil
- })
- if err == wait.ErrWaitTimeout {
- return fmt.Errorf("timed out waiting for %q to be synced", name)
- }
- return err
- }
- }
- return nil
- }
- // ValidateReplicaSet ensures that the preconditions match. Returns nil if they are valid, an error otherwise
- func (precondition *ScalePrecondition) ValidateReplicaSet(replicaSet *extensions.ReplicaSet) error {
- if precondition.Size != -1 && int(replicaSet.Spec.Replicas) != precondition.Size {
- return PreconditionError{"replicas", strconv.Itoa(precondition.Size), strconv.Itoa(int(replicaSet.Spec.Replicas))}
- }
- if len(precondition.ResourceVersion) != 0 && replicaSet.ResourceVersion != precondition.ResourceVersion {
- return PreconditionError{"resource version", precondition.ResourceVersion, replicaSet.ResourceVersion}
- }
- return nil
- }
- type ReplicaSetScaler struct {
- c client.ExtensionsInterface
- }
- // ScaleSimple does a simple one-shot attempt at scaling. It returns the
- // resourceVersion of the replicaset if the update is successful.
- func (scaler *ReplicaSetScaler) ScaleSimple(namespace, name string, preconditions *ScalePrecondition, newSize uint) (string, error) {
- rs, err := scaler.c.ReplicaSets(namespace).Get(name)
- if err != nil {
- return "", ScaleError{ScaleGetFailure, "Unknown", err}
- }
- if preconditions != nil {
- if err := preconditions.ValidateReplicaSet(rs); err != nil {
- return "", err
- }
- }
- rs.Spec.Replicas = int32(newSize)
- updatedRS, err := scaler.c.ReplicaSets(namespace).Update(rs)
- if err != nil {
- if errors.IsConflict(err) {
- return "", ScaleError{ScaleUpdateConflictFailure, rs.ResourceVersion, err}
- }
- return "", ScaleError{ScaleUpdateFailure, rs.ResourceVersion, err}
- }
- return updatedRS.ObjectMeta.ResourceVersion, nil
- }
- // Scale updates a ReplicaSet to a new size, with optional precondition check (if preconditions is
- // not nil), optional retries (if retry is not nil), and then optionally waits for it's replica
- // count to reach the new value (if wait is not nil).
- func (scaler *ReplicaSetScaler) Scale(namespace, name string, newSize uint, preconditions *ScalePrecondition, retry, waitForReplicas *RetryParams) error {
- if preconditions == nil {
- preconditions = &ScalePrecondition{-1, ""}
- }
- if retry == nil {
- // Make it try only once, immediately
- retry = &RetryParams{Interval: time.Millisecond, Timeout: time.Millisecond}
- }
- cond := ScaleCondition(scaler, preconditions, namespace, name, newSize, nil)
- if err := wait.Poll(retry.Interval, retry.Timeout, cond); err != nil {
- return err
- }
- if waitForReplicas != nil {
- rs, err := scaler.c.ReplicaSets(namespace).Get(name)
- if err != nil {
- return err
- }
- err = wait.Poll(waitForReplicas.Interval, waitForReplicas.Timeout, client.ReplicaSetHasDesiredReplicas(scaler.c, rs))
- if err == wait.ErrWaitTimeout {
- return fmt.Errorf("timed out waiting for %q to be synced", name)
- }
- return err
- }
- return nil
- }
- // ValidateJob ensures that the preconditions match. Returns nil if they are valid, an error otherwise.
- func (precondition *ScalePrecondition) ValidateJob(job *batch.Job) error {
- if precondition.Size != -1 && job.Spec.Parallelism == nil {
- return PreconditionError{"parallelism", strconv.Itoa(precondition.Size), "nil"}
- }
- if precondition.Size != -1 && int(*job.Spec.Parallelism) != precondition.Size {
- return PreconditionError{"parallelism", strconv.Itoa(precondition.Size), strconv.Itoa(int(*job.Spec.Parallelism))}
- }
- if len(precondition.ResourceVersion) != 0 && job.ResourceVersion != precondition.ResourceVersion {
- return PreconditionError{"resource version", precondition.ResourceVersion, job.ResourceVersion}
- }
- return nil
- }
- type PetSetScaler struct {
- c client.AppsInterface
- }
- // ScaleSimple does a simple one-shot attempt at scaling. It returns the
- // resourceVersion of the petset if the update is successful.
- func (scaler *PetSetScaler) ScaleSimple(namespace, name string, preconditions *ScalePrecondition, newSize uint) (string, error) {
- ps, err := scaler.c.PetSets(namespace).Get(name)
- if err != nil {
- return "", ScaleError{ScaleGetFailure, "Unknown", err}
- }
- if preconditions != nil {
- if err := preconditions.ValidatePetSet(ps); err != nil {
- return "", err
- }
- }
- ps.Spec.Replicas = int(newSize)
- updatedPetSet, err := scaler.c.PetSets(namespace).Update(ps)
- if err != nil {
- if errors.IsConflict(err) {
- return "", ScaleError{ScaleUpdateConflictFailure, ps.ResourceVersion, err}
- }
- return "", ScaleError{ScaleUpdateFailure, ps.ResourceVersion, err}
- }
- return updatedPetSet.ResourceVersion, nil
- }
- func (scaler *PetSetScaler) Scale(namespace, name string, newSize uint, preconditions *ScalePrecondition, retry, waitForReplicas *RetryParams) error {
- if preconditions == nil {
- preconditions = &ScalePrecondition{-1, ""}
- }
- if retry == nil {
- // Make it try only once, immediately
- retry = &RetryParams{Interval: time.Millisecond, Timeout: time.Millisecond}
- }
- cond := ScaleCondition(scaler, preconditions, namespace, name, newSize, nil)
- if err := wait.Poll(retry.Interval, retry.Timeout, cond); err != nil {
- return err
- }
- if waitForReplicas != nil {
- job, err := scaler.c.PetSets(namespace).Get(name)
- if err != nil {
- return err
- }
- err = wait.Poll(waitForReplicas.Interval, waitForReplicas.Timeout, client.PetSetHasDesiredPets(scaler.c, job))
- if err == wait.ErrWaitTimeout {
- return fmt.Errorf("timed out waiting for %q to be synced", name)
- }
- return err
- }
- return nil
- }
- type JobScaler struct {
- c client.BatchInterface
- }
- // ScaleSimple is responsible for updating job's parallelism. It returns the
- // resourceVersion of the job if the update is successful.
- func (scaler *JobScaler) ScaleSimple(namespace, name string, preconditions *ScalePrecondition, newSize uint) (string, error) {
- job, err := scaler.c.Jobs(namespace).Get(name)
- if err != nil {
- return "", ScaleError{ScaleGetFailure, "Unknown", err}
- }
- if preconditions != nil {
- if err := preconditions.ValidateJob(job); err != nil {
- return "", err
- }
- }
- parallelism := int32(newSize)
- job.Spec.Parallelism = ¶llelism
- udpatedJob, err := scaler.c.Jobs(namespace).Update(job)
- if err != nil {
- if errors.IsConflict(err) {
- return "", ScaleError{ScaleUpdateConflictFailure, job.ResourceVersion, err}
- }
- return "", ScaleError{ScaleUpdateFailure, job.ResourceVersion, err}
- }
- return udpatedJob.ObjectMeta.ResourceVersion, nil
- }
- // Scale updates a Job to a new size, with optional precondition check (if preconditions is not nil),
- // optional retries (if retry is not nil), and then optionally waits for parallelism to reach desired
- // number, which can be less than requested based on job's current progress.
- func (scaler *JobScaler) Scale(namespace, name string, newSize uint, preconditions *ScalePrecondition, retry, waitForReplicas *RetryParams) error {
- if preconditions == nil {
- preconditions = &ScalePrecondition{-1, ""}
- }
- if retry == nil {
- // Make it try only once, immediately
- retry = &RetryParams{Interval: time.Millisecond, Timeout: time.Millisecond}
- }
- cond := ScaleCondition(scaler, preconditions, namespace, name, newSize, nil)
- if err := wait.Poll(retry.Interval, retry.Timeout, cond); err != nil {
- return err
- }
- if waitForReplicas != nil {
- job, err := scaler.c.Jobs(namespace).Get(name)
- if err != nil {
- return err
- }
- err = wait.Poll(waitForReplicas.Interval, waitForReplicas.Timeout, client.JobHasDesiredParallelism(scaler.c, job))
- if err == wait.ErrWaitTimeout {
- return fmt.Errorf("timed out waiting for %q to be synced", name)
- }
- return err
- }
- return nil
- }
- // ValidateDeployment ensures that the preconditions match. Returns nil if they are valid, an error otherwise.
- func (precondition *ScalePrecondition) ValidateDeployment(deployment *extensions.Deployment) error {
- if precondition.Size != -1 && int(deployment.Spec.Replicas) != precondition.Size {
- return PreconditionError{"replicas", strconv.Itoa(precondition.Size), strconv.Itoa(int(deployment.Spec.Replicas))}
- }
- if len(precondition.ResourceVersion) != 0 && deployment.ResourceVersion != precondition.ResourceVersion {
- return PreconditionError{"resource version", precondition.ResourceVersion, deployment.ResourceVersion}
- }
- return nil
- }
- type DeploymentScaler struct {
- c client.ExtensionsInterface
- }
- // ScaleSimple is responsible for updating a deployment's desired replicas
- // count. It returns the resourceVersion of the deployment if the update is
- // successful.
- func (scaler *DeploymentScaler) ScaleSimple(namespace, name string, preconditions *ScalePrecondition, newSize uint) (string, error) {
- deployment, err := scaler.c.Deployments(namespace).Get(name)
- if err != nil {
- return "", ScaleError{ScaleGetFailure, "Unknown", err}
- }
- if preconditions != nil {
- if err := preconditions.ValidateDeployment(deployment); err != nil {
- return "", err
- }
- }
- // TODO(madhusudancs): Fix this when Scale group issues are resolved (see issue #18528).
- // For now I'm falling back to regular Deployment update operation.
- deployment.Spec.Replicas = int32(newSize)
- updatedDeployment, err := scaler.c.Deployments(namespace).Update(deployment)
- if err != nil {
- if errors.IsConflict(err) {
- return "", ScaleError{ScaleUpdateConflictFailure, deployment.ResourceVersion, err}
- }
- return "", ScaleError{ScaleUpdateFailure, deployment.ResourceVersion, err}
- }
- return updatedDeployment.ObjectMeta.ResourceVersion, nil
- }
- // Scale updates a deployment to a new size, with optional precondition check (if preconditions is not nil),
- // optional retries (if retry is not nil), and then optionally waits for the status to reach desired count.
- func (scaler *DeploymentScaler) Scale(namespace, name string, newSize uint, preconditions *ScalePrecondition, retry, waitForReplicas *RetryParams) error {
- if preconditions == nil {
- preconditions = &ScalePrecondition{-1, ""}
- }
- if retry == nil {
- // Make it try only once, immediately
- retry = &RetryParams{Interval: time.Millisecond, Timeout: time.Millisecond}
- }
- cond := ScaleCondition(scaler, preconditions, namespace, name, newSize, nil)
- if err := wait.Poll(retry.Interval, retry.Timeout, cond); err != nil {
- return err
- }
- if waitForReplicas != nil {
- deployment, err := scaler.c.Deployments(namespace).Get(name)
- if err != nil {
- return err
- }
- err = wait.Poll(waitForReplicas.Interval, waitForReplicas.Timeout, client.DeploymentHasDesiredReplicas(scaler.c, deployment))
- if err == wait.ErrWaitTimeout {
- return fmt.Errorf("timed out waiting for %q to be synced", name)
- }
- return err
- }
- return nil
- }
|