From 86c2709082310ca48d0939bd78a9a55505a37ddb Mon Sep 17 00:00:00 2001 From: druppelt <44848632+druppelt@users.noreply.github.com> Date: Sat, 14 Sep 2024 14:15:18 +0200 Subject: [PATCH] fix: correctly calculate maxReplicas for rollingUpdate deployments & rolling DeploymentConfigs Correctly calculate the maxReplicas as `replicas + maxSurge` instead of `replicas + maxSurge - maxUnavailable` Refs: #20 --- internal/calc/deployment.go | 39 +++++++++++++++----------- internal/calc/deploymentConfig.go | 38 ++++++++++++++----------- internal/calc/deploymentConfig_test.go | 10 +++---- internal/calc/deployment_test.go | 30 ++++++++++---------- 4 files changed, 65 insertions(+), 52 deletions(-) diff --git a/internal/calc/deployment.go b/internal/calc/deployment.go index 090c0de..5c26144 100644 --- a/internal/calc/deployment.go +++ b/internal/calc/deployment.go @@ -1,6 +1,7 @@ package calc import ( + "errors" "fmt" "math" @@ -10,10 +11,10 @@ import ( // calculates the cpu/memory resources a single deployment needs. Replicas and the deployment // strategy are taken into account. -func deployment(deployment appsv1.Deployment) (*ResourceUsage, error) { +func deployment(deployment appsv1.Deployment) (*ResourceUsage, error) { //nolint:funlen // disable function length linting var ( - resourceOverhead float64 // max overhead compute resources (percent) - podOverhead int32 // max overhead pods during deployment + maxUnavailable int32 // max amount of unavailable pods during a deployment + maxSurge int32 // max amount of pods that are allowed in addition to replicas during deployment ) replicas := deployment.Spec.Replicas @@ -35,9 +36,9 @@ func deployment(deployment appsv1.Deployment) (*ResourceUsage, error) { switch strategy.Type { case appsv1.RecreateDeploymentStrategyType: - // no overhead on recreate - resourceOverhead = 1 - podOverhead = 0 + // kill all existing pods, then recreate new ones at once -> no overhead on recreate + maxUnavailable = *replicas + maxSurge = 0 case "": // RollingUpdate is the default and can be an empty string. If so, set the defaults // (https://pkg.go.dev/k8s.io/api/apps/v1?tab=doc#RollingUpdateDeployment) and continue calculation. @@ -69,31 +70,37 @@ func deployment(deployment appsv1.Deployment) (*ResourceUsage, error) { } // docs say, that the absolute number is calculated by rounding down. - maxUnavailable, err := intstr.GetScaledValueFromIntOrPercent(&maxUnavailableValue, int(*replicas), false) + maxUnavailableInt, err := intstr.GetScaledValueFromIntOrPercent(&maxUnavailableValue, int(*replicas), false) if err != nil { return nil, err } + if maxUnavailableInt < math.MinInt32 || maxUnavailableInt > math.MaxInt32 { + return nil, errors.New("maxUnavailableInt out of int32 boundaries") + } + + maxUnavailable = int32(maxUnavailableInt) + // docs say, absolute number is calculated by rounding up. - maxSurge, err := intstr.GetScaledValueFromIntOrPercent(&maxSurgeValue, int(*replicas), true) + maxSurgeInt, err := intstr.GetScaledValueFromIntOrPercent(&maxSurgeValue, int(*replicas), true) if err != nil { return nil, err } - // podOverhead is the number of pods which can run more during a deployment - podOverheadInt := maxSurge - maxUnavailable - if podOverheadInt > math.MaxInt32 || podOverheadInt < math.MinInt32 { - return nil, fmt.Errorf("deployment: %s maxSurge - maxUnavailable (%d-%d) was out of bounds for int32", deployment.Name, maxSurge, maxUnavailable) + if maxSurgeInt < math.MinInt32 || maxSurgeInt > math.MaxInt32 { + return nil, errors.New("maxSurgeInt out of int32 boundaries") } - podOverhead = int32(podOverheadInt) //nolint:gosec,wsl // gosec doesn't understand that the int conversion is already guarded, wsl wants to group the assignment with the next block - resourceOverhead = (float64(podOverhead) / float64(*replicas)) + 1 + maxSurge = int32(maxSurgeInt) + default: return nil, fmt.Errorf("deployment: %s deployment strategy %q is unknown", deployment.Name, strategy.Type) } + _ = maxUnavailable // fix complaining compiler. will need this field in the future + podResources := podResources(&deployment.Spec.Template.Spec) - newResources := podResources.Mul(float64(*replicas)).Mul(resourceOverhead) + newResources := podResources.Mul(float64(*replicas + maxSurge)) resourceUsage := ResourceUsage{ Resources: newResources, @@ -103,7 +110,7 @@ func deployment(deployment appsv1.Deployment) (*ResourceUsage, error) { Name: deployment.Name, Replicas: *replicas, Strategy: string(strategy.Type), - MaxReplicas: *replicas + podOverhead, + MaxReplicas: *replicas + maxSurge, }, } diff --git a/internal/calc/deploymentConfig.go b/internal/calc/deploymentConfig.go index 85ee4b8..d9cea28 100644 --- a/internal/calc/deploymentConfig.go +++ b/internal/calc/deploymentConfig.go @@ -1,6 +1,7 @@ package calc import ( + "errors" "fmt" "math" @@ -10,10 +11,10 @@ import ( // calculates the cpu/memory resources a single deployment needs. Replicas and the deployment // strategy are taken into account. -func deploymentConfig(deploymentConfig openshiftAppsV1.DeploymentConfig) (*ResourceUsage, error) { +func deploymentConfig(deploymentConfig openshiftAppsV1.DeploymentConfig) (*ResourceUsage, error) { //nolint:funlen // disable function length linting var ( - resourceOverhead float64 // max overhead compute resources (percent) - podOverhead int32 // max overhead pods during deploymentConfig + maxUnavailable int32 // max amount of unavailable pods during a deployment + maxSurge int32 // max amount of pods that are allowed in addition to replicas during deployment ) replicas := deploymentConfig.Spec.Replicas @@ -35,9 +36,9 @@ func deploymentConfig(deploymentConfig openshiftAppsV1.DeploymentConfig) (*Resou // TODO lookup default values, these are copied from kubernetes Deployment switch strategy.Type { case openshiftAppsV1.DeploymentStrategyTypeRecreate: - // no overhead on recreate - resourceOverhead = 1 - podOverhead = 0 + // kill all existing pods, then recreate new ones at once -> no overhead on recreate + maxUnavailable = replicas + maxSurge = 0 case "": // Rolling is the default and can be an empty string. If so, set the defaults // (https://pkg.go.dev/k8s.io/api/apps/v1?tab=doc#RollingUpdateDeployment) and continue calculation. @@ -69,32 +70,37 @@ func deploymentConfig(deploymentConfig openshiftAppsV1.DeploymentConfig) (*Resou } // docs say, that the absolute number is calculated by rounding down. - maxUnavailable, err := intstr.GetScaledValueFromIntOrPercent(&maxUnavailableValue, int(replicas), false) + maxUnavailableInt, err := intstr.GetScaledValueFromIntOrPercent(&maxUnavailableValue, int(replicas), false) if err != nil { return nil, err } + if maxUnavailableInt < math.MinInt32 || maxUnavailableInt > math.MaxInt32 { + return nil, errors.New("maxUnavailableInt out of int32 boundaries") + } + + maxUnavailable = int32(maxUnavailableInt) + // docs say, absolute number is calculated by rounding up. - maxSurge, err := intstr.GetScaledValueFromIntOrPercent(&maxSurgeValue, int(replicas), true) + maxSurgeInt, err := intstr.GetScaledValueFromIntOrPercent(&maxSurgeValue, int(replicas), true) if err != nil { return nil, err } - // podOverhead is the number of pods which can run more during a deployment - podOverheadInt := maxSurge - maxUnavailable - if podOverheadInt > math.MaxInt32 || podOverheadInt < math.MinInt32 { - return nil, fmt.Errorf("deploymentConfig: %s maxSurge - maxUnavailable (%d-%d) was out of bounds for int32", deploymentConfig.Name, maxSurge, maxUnavailable) + if maxSurgeInt < math.MinInt32 || maxSurgeInt > math.MaxInt32 { + return nil, errors.New("maxSurgeInt out of int32 boundaries") } - podOverhead = int32(podOverheadInt) //nolint:gosec,wsl // gosec doesn't understand that the int conversion is already guarded, wsl wants to group the assignment with the next block - resourceOverhead = (float64(podOverhead) / float64(replicas)) + 1 + maxSurge = int32(maxSurgeInt) default: return nil, fmt.Errorf("deploymentConfig: %s deploymentConfig strategy %q is unknown", deploymentConfig.Name, strategy.Type) } + _ = maxUnavailable // fix complaining compiler. will need this field in the future + podResources := podResources(&deploymentConfig.Spec.Template.Spec) strategyResources := ConvertToResources(&deploymentConfig.Spec.Strategy.Resources) - newResources := podResources.Mul(float64(replicas)).Mul(resourceOverhead).Add(strategyResources) + newResources := podResources.Mul(float64(replicas + maxSurge)).Add(strategyResources) resourceUsage := ResourceUsage{ Resources: newResources, @@ -104,7 +110,7 @@ func deploymentConfig(deploymentConfig openshiftAppsV1.DeploymentConfig) (*Resou Name: deploymentConfig.Name, Replicas: replicas, Strategy: string(strategy.Type), - MaxReplicas: replicas + podOverhead, + MaxReplicas: replicas + maxSurge, }, } diff --git a/internal/calc/deploymentConfig_test.go b/internal/calc/deploymentConfig_test.go index acbd569..e65d972 100644 --- a/internal/calc/deploymentConfig_test.go +++ b/internal/calc/deploymentConfig_test.go @@ -23,12 +23,12 @@ func TestDeploymentConfig(t *testing.T) { { name: "normal deploymentConfig", deploymentConfig: normalDeploymentConfig, - cpuMin: resource.MustParse("2750m"), - cpuMax: resource.MustParse("5500m"), - memoryMin: resource.MustParse("22Gi"), - memoryMax: resource.MustParse("44Gi"), + cpuMin: resource.MustParse("3250m"), + cpuMax: resource.MustParse("6500m"), + memoryMin: resource.MustParse("26Gi"), + memoryMax: resource.MustParse("52Gi"), replicas: 10, - maxReplicas: 11, + maxReplicas: 13, strategy: openshiftAppsV1.DeploymentStrategyTypeRolling, }, //TODO add more tests diff --git a/internal/calc/deployment_test.go b/internal/calc/deployment_test.go index ed308d2..5f666e7 100644 --- a/internal/calc/deployment_test.go +++ b/internal/calc/deployment_test.go @@ -23,23 +23,23 @@ func TestDeployment(t *testing.T) { { name: "normal deployment", deployment: normalDeployment, - cpuMin: resource.MustParse("2750m"), - cpuMax: resource.MustParse("5500m"), - memoryMin: resource.MustParse("22Gi"), - memoryMax: resource.MustParse("44Gi"), + cpuMin: resource.MustParse("3250m"), + cpuMax: resource.MustParse("6500m"), + memoryMin: resource.MustParse("26Gi"), + memoryMax: resource.MustParse("52Gi"), replicas: 10, - maxReplicas: 11, + maxReplicas: 13, strategy: appsv1.RollingUpdateDeploymentStrategyType, }, { name: "deployment without strategy", deployment: deploymentWithoutStrategy, - cpuMin: resource.MustParse("2750m"), - cpuMax: resource.MustParse("11"), - memoryMin: resource.MustParse("22Gi"), - memoryMax: resource.MustParse("44Gi"), + cpuMin: resource.MustParse("3250m"), + cpuMax: resource.MustParse("13"), + memoryMin: resource.MustParse("26Gi"), + memoryMax: resource.MustParse("52Gi"), replicas: 10, - maxReplicas: 11, + maxReplicas: 13, strategy: appsv1.RollingUpdateDeploymentStrategyType, }, { @@ -78,12 +78,12 @@ func TestDeployment(t *testing.T) { { name: "deployment without max unavailable/surge values", deployment: deploymentWithoutValues, - cpuMin: resource.MustParse("2750m"), - cpuMax: resource.MustParse("11"), - memoryMin: resource.MustParse("22Gi"), - memoryMax: resource.MustParse("44Gi"), + cpuMin: resource.MustParse("3250m"), + cpuMax: resource.MustParse("13"), + memoryMin: resource.MustParse("26Gi"), + memoryMax: resource.MustParse("52Gi"), replicas: 10, - maxReplicas: 11, + maxReplicas: 13, strategy: appsv1.RollingUpdateDeploymentStrategyType, }, {