Skip to content

Commit

Permalink
scheduler: add downgrade strategy for empty 'aggregated' on cold koor… (
Browse files Browse the repository at this point in the history
#2239)

Signed-off-by: clay-wangzhi <[email protected]>
  • Loading branch information
clay-wangzhi authored Nov 7, 2024
1 parent 6fc4205 commit 81dfad9
Show file tree
Hide file tree
Showing 2 changed files with 188 additions and 6 deletions.
18 changes: 12 additions & 6 deletions pkg/scheduler/plugins/loadaware/helper.go
Original file line number Diff line number Diff line change
Expand Up @@ -60,20 +60,26 @@ func getTargetAggregatedUsage(nodeMetric *slov1alpha1.NodeMetric, aggregatedDura
return nil
}

// If no specific period is set, the maximum period recorded by NodeMetrics will be used by default.
// If no specific period is set, the non-empty maximum period recorded by NodeMetrics will be used by default.
// This is a default policy.
if aggregatedDuration == nil || aggregatedDuration.Duration == 0 {
var maxDuration time.Duration
var maxIndex int
var maxIndex int = -1
for i, v := range nodeMetric.Status.NodeMetric.AggregatedNodeUsages {
if v.Duration.Duration > maxDuration {
if len(v.Usage[aggregationType].ResourceList) > 0 && v.Duration.Duration > maxDuration {
maxDuration = v.Duration.Duration
maxIndex = i
}
}
aggregatedNodeUsage := &nodeMetric.Status.NodeMetric.AggregatedNodeUsages[maxIndex]
usage := aggregatedNodeUsage.Usage[aggregationType]
if len(usage.ResourceList) > 0 {

if maxIndex == -1 {
// No entry in AggregatedNodeUsages has a non-empty resource list for this aggregation type, downgrade to use the values in NodeUsage
usage := nodeMetric.Status.NodeMetric.NodeUsage
if len(usage.ResourceList) > 0 {
return &usage
}
} else {
usage := nodeMetric.Status.NodeMetric.AggregatedNodeUsages[maxIndex].Usage[aggregationType]
return &usage
}
} else if aggregatedDuration != nil {
Expand Down
176 changes: 176 additions & 0 deletions pkg/scheduler/plugins/loadaware/helper_test.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,176 @@
/*
Copyright 2022 The Koordinator Authors.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package loadaware

import (
"testing"
"time"

"github.com/stretchr/testify/assert"
corev1 "k8s.io/api/core/v1"
"k8s.io/apimachinery/pkg/api/resource"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"

"github.com/koordinator-sh/koordinator/apis/extension"
slov1alpha1 "github.com/koordinator-sh/koordinator/apis/slo/v1alpha1"
)

// Test cases description:
// 1. When nodeMetric contains valid AggregatedNodeUsages and aggregatedDuration is nil, it should return the non-empty longest duration resource usage.
// 2. When aggregatedDuration is not nil and matches a duration in AggregatedNodeUsages, it should return the corresponding resource usage.
// 3. When nodeMetric's NodeUsage contains a valid resource list and every entry in AggregatedNodeUsages has an empty resource list, it should return the resource usage of NodeUsage.

// TestGetTargetAggregatedUsage is a table-driven test of getTargetAggregatedUsage
// for the P95 aggregation type. Each case supplies a NodeMetric fixture and an
// optional aggregated duration, and states the ResourceMap the call is expected
// to return.
func TestGetTargetAggregatedUsage(t *testing.T) {
	aggregationType := extension.P95

	// cpuOnly builds a ResourceList carrying a single CPU quantity.
	cpuOnly := func(quantity string) corev1.ResourceList {
		return corev1.ResourceList{
			corev1.ResourceCPU: resource.MustParse(quantity),
		}
	}

	// window builds one AggregatedUsage entry for the given period whose usage
	// for aggregationType is the supplied list (which may be nil).
	window := func(period time.Duration, list corev1.ResourceList) slov1alpha1.AggregatedUsage {
		return slov1alpha1.AggregatedUsage{
			Duration: metav1.Duration{Duration: period},
			Usage: map[extension.AggregationType]slov1alpha1.ResourceMap{
				aggregationType: {
					ResourceList: list,
				},
			},
		}
	}

	// metricOf wraps an instantaneous node usage and the aggregated windows
	// into a NodeMetric object.
	metricOf := func(nodeUsage slov1alpha1.ResourceMap, windows ...slov1alpha1.AggregatedUsage) *slov1alpha1.NodeMetric {
		return &slov1alpha1.NodeMetric{
			Status: slov1alpha1.NodeMetricStatus{
				NodeMetric: &slov1alpha1.NodeMetricInfo{
					NodeUsage:            nodeUsage,
					AggregatedNodeUsages: windows,
				},
			},
		}
	}

	cases := []struct {
		name     string
		metric   *slov1alpha1.NodeMetric
		duration *metav1.Duration
		want     *slov1alpha1.ResourceMap
	}{
		{
			// The longest window (15m) has a nil resource list, so the
			// 10m window's usage is the expected result.
			name: "Valid AggregatedNodeUsages and aggregatedDuration is nil",
			metric: metricOf(
				slov1alpha1.ResourceMap{},
				window(5*time.Minute, cpuOnly("30")),
				window(10*time.Minute, cpuOnly("50")),
				window(15*time.Minute, nil),
			),
			duration: nil,
			want:     &slov1alpha1.ResourceMap{ResourceList: cpuOnly("50")},
		},
		{
			// An explicit 5m duration is requested; the 5m window's usage
			// is the expected result.
			name: "aggregatedDuration is not nil and matches a duration",
			metric: metricOf(
				slov1alpha1.ResourceMap{},
				window(5*time.Minute, cpuOnly("30")),
				window(10*time.Minute, cpuOnly("50")),
				window(15*time.Minute, cpuOnly("70")),
			),
			duration: &metav1.Duration{Duration: 5 * time.Minute},
			want:     &slov1alpha1.ResourceMap{ResourceList: cpuOnly("30")},
		},
		{
			// The only window has a nil resource list, so NodeUsage is the
			// expected result.
			name: "NodeUsage contains a valid resource list and AggregatedNodeUsages is empty",
			metric: metricOf(
				slov1alpha1.ResourceMap{ResourceList: cpuOnly("30")},
				window(5*time.Minute, nil),
			),
			duration: nil,
			want:     &slov1alpha1.ResourceMap{ResourceList: cpuOnly("30")},
		},
	}

	for i := range cases {
		tc := cases[i]
		t.Run(tc.name, func(t *testing.T) {
			got := getTargetAggregatedUsage(tc.metric, tc.duration, aggregationType)
			assert.Equal(t, tc.want, got)
		})
	}
}

0 comments on commit 81dfad9

Please sign in to comment.