From 0ec9524244bb805de7f62e1a30fa0cf105b47273 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Kuba=20Tu=C5=BCnik?= Date: Mon, 30 Sep 2024 21:20:49 +0200 Subject: [PATCH] TMP squash: #7479, #7497, #7529 DONOTSUBMIT --- .../config/autoscaling_options.go | 2 + .../context/autoscaling_context.go | 11 +- cluster-autoscaler/core/autoscaler.go | 17 +- .../currently_drained_nodes_test.go | 15 +- .../podlistprocessor/filter_out_expendable.go | 1 + .../filter_out_expendable_test.go | 7 +- .../filter_out_schedulable.go | 5 +- .../filter_out_schedulable_test.go | 28 +- .../podlistprocessor/pod_list_processor.go | 5 +- .../core/scaledown/actuation/actuator.go | 7 +- .../core/scaledown/actuation/actuator_test.go | 4 +- .../core/scaledown/actuation/drain_test.go | 4 +- .../core/scaledown/eligibility/eligibility.go | 2 +- .../scaledown/eligibility/eligibility_test.go | 9 +- .../core/scaledown/planner/planner.go | 4 +- .../core/scaledown/planner/planner_test.go | 4 +- .../core/scaledown/unneeded/nodes_test.go | 7 +- .../scaleup/orchestrator/async_initializer.go | 4 +- .../core/scaleup/orchestrator/orchestrator.go | 11 +- .../scaleup/orchestrator/orchestrator_test.go | 51 +- .../core/scaleup/resource/manager_test.go | 13 +- cluster-autoscaler/core/static_autoscaler.go | 11 +- .../core/static_autoscaler_test.go | 68 ++- cluster-autoscaler/core/test/common.go | 13 +- cluster-autoscaler/core/utils/utils.go | 77 --- cluster-autoscaler/core/utils/utils_test.go | 29 - .../estimator/binpacking_estimator.go | 52 +- .../estimator/binpacking_estimator_test.go | 22 +- cluster-autoscaler/estimator/estimator.go | 6 +- cluster-autoscaler/go.mod | 59 -- cluster-autoscaler/main.go | 23 +- .../mixed_nodeinfos_processor.go | 42 +- .../mixed_nodeinfos_processor_test.go | 55 +- .../nodes/scale_down_set_processor_test.go | 3 +- .../pod_injection_processor_test.go | 5 +- .../processors/provreq/processor.go | 5 +- .../processors/provreq/processor_test.go | 7 +- cluster-autoscaler/processors/test/common.go | 2 +- 
.../orchestrator/orchestrator.go | 2 +- .../orchestrator/orchestrator_test.go | 4 - cluster-autoscaler/simulator/cluster.go | 8 +- cluster-autoscaler/simulator/cluster_test.go | 25 +- .../clustersnapshot/{ => base}/basic.go | 103 ++-- .../clustersnapshot/{ => base}/delta.go | 99 ++-- .../base/delta_benchmark_test.go | 88 +++ .../clustersnapshot/clustersnapshot.go | 63 ++- .../simulator/clustersnapshot/error.go | 149 +++++ .../predicate/plugin_runner.go | 138 +++++ .../predicate/plugin_runner_test.go | 337 ++++++++++++ .../predicate/predicate_snapshot.go | 107 ++++ .../predicate_snapshot_benchmark_test.go} | 143 +---- .../predicate_snapshot_test.go} | 142 +++-- .../simulator/clustersnapshot/test_utils.go | 52 +- .../testsnapshot/test_snapshot.go | 65 +++ .../dynamicresources/snapshot/snapshot.go | 48 ++ .../framework/delegating_shared_lister.go | 182 +++++++ .../simulator/framework/handle.go | 99 ++++ .../simulator/framework/infos.go | 54 +- .../simulator/framework/infos_test.go | 82 ++- .../simulator/framework/test_utils.go | 32 +- .../simulator/node_info_utils.go | 153 ++++++ .../simulator/node_info_utils_test.go | 510 ++++++++++++++++++ cluster-autoscaler/simulator/nodes.go | 71 --- cluster-autoscaler/simulator/nodes_test.go | 239 -------- .../delegating_shared_lister.go | 96 ---- .../simulator/predicatechecker/error.go | 107 ---- .../simulator/predicatechecker/interface.go | 31 -- .../predicatechecker/schedulerbased.go | 198 ------- .../predicatechecker/schedulerbased_test.go | 322 ----------- .../simulator/predicatechecker/testchecker.go | 45 -- .../simulator/scheduling/hinting_simulator.go | 60 +-- .../scheduling/hinting_simulator_test.go | 23 +- .../utils/daemonset/daemonset.go | 5 + .../utils/scheduler/scheduler.go | 22 - 74 files changed, 2643 insertions(+), 1951 deletions(-) rename cluster-autoscaler/simulator/clustersnapshot/{ => base}/basic.go (73%) rename cluster-autoscaler/simulator/clustersnapshot/{ => base}/delta.go (81%) create mode 100644 
cluster-autoscaler/simulator/clustersnapshot/base/delta_benchmark_test.go create mode 100644 cluster-autoscaler/simulator/clustersnapshot/error.go create mode 100644 cluster-autoscaler/simulator/clustersnapshot/predicate/plugin_runner.go create mode 100644 cluster-autoscaler/simulator/clustersnapshot/predicate/plugin_runner_test.go create mode 100644 cluster-autoscaler/simulator/clustersnapshot/predicate/predicate_snapshot.go rename cluster-autoscaler/simulator/clustersnapshot/{clustersnapshot_benchmark_test.go => predicate/predicate_snapshot_benchmark_test.go} (53%) rename cluster-autoscaler/simulator/clustersnapshot/{clustersnapshot_test.go => predicate/predicate_snapshot_test.go} (81%) create mode 100644 cluster-autoscaler/simulator/clustersnapshot/testsnapshot/test_snapshot.go create mode 100644 cluster-autoscaler/simulator/dynamicresources/snapshot/snapshot.go create mode 100644 cluster-autoscaler/simulator/framework/delegating_shared_lister.go create mode 100644 cluster-autoscaler/simulator/framework/handle.go create mode 100644 cluster-autoscaler/simulator/node_info_utils.go create mode 100644 cluster-autoscaler/simulator/node_info_utils_test.go delete mode 100644 cluster-autoscaler/simulator/nodes.go delete mode 100644 cluster-autoscaler/simulator/nodes_test.go delete mode 100644 cluster-autoscaler/simulator/predicatechecker/delegating_shared_lister.go delete mode 100644 cluster-autoscaler/simulator/predicatechecker/error.go delete mode 100644 cluster-autoscaler/simulator/predicatechecker/interface.go delete mode 100644 cluster-autoscaler/simulator/predicatechecker/schedulerbased.go delete mode 100644 cluster-autoscaler/simulator/predicatechecker/schedulerbased_test.go delete mode 100644 cluster-autoscaler/simulator/predicatechecker/testchecker.go diff --git a/cluster-autoscaler/config/autoscaling_options.go b/cluster-autoscaler/config/autoscaling_options.go index aa902058c184..ed4a8b645801 100644 --- a/cluster-autoscaler/config/autoscaling_options.go +++ 
b/cluster-autoscaler/config/autoscaling_options.go @@ -309,6 +309,8 @@ type AutoscalingOptions struct { CheckCapacityProvisioningRequestBatchTimebox time.Duration // ForceDeleteLongUnregisteredNodes is used to enable/disable ignoring min size constraints during removal of long unregistered nodes ForceDeleteLongUnregisteredNodes bool + // DynamicResourceAllocationEnabled configures whether logic for handling DRA objects is enabled. + DynamicResourceAllocationEnabled bool } // KubeClientOptions specify options for kube client diff --git a/cluster-autoscaler/context/autoscaling_context.go b/cluster-autoscaler/context/autoscaling_context.go index 1743e8c443c9..31e2af8f4fce 100644 --- a/cluster-autoscaler/context/autoscaling_context.go +++ b/cluster-autoscaler/context/autoscaling_context.go @@ -27,7 +27,7 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/expander" processor_callbacks "k8s.io/autoscaler/cluster-autoscaler/processors/callbacks" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" + "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" "k8s.io/client-go/informers" kube_client "k8s.io/client-go/kubernetes" @@ -44,9 +44,8 @@ type AutoscalingContext struct { AutoscalingKubeClients // CloudProvider used in CA. CloudProvider cloudprovider.CloudProvider - // TODO(kgolab) - move away too as it's not config - // PredicateChecker to check if a pod can fit into a node. - PredicateChecker predicatechecker.PredicateChecker + // FrameworkHandle can be used to interact with the scheduler framework. + FrameworkHandle *framework.Handle // ClusterSnapshot denotes cluster snapshot used for predicate checking. 
ClusterSnapshot clustersnapshot.ClusterSnapshot // ExpanderStrategy is the strategy used to choose which node group to expand when scaling up @@ -100,7 +99,7 @@ func NewResourceLimiterFromAutoscalingOptions(options config.AutoscalingOptions) // NewAutoscalingContext returns an autoscaling context from all the necessary parameters passed via arguments func NewAutoscalingContext( options config.AutoscalingOptions, - predicateChecker predicatechecker.PredicateChecker, + fwHandle *framework.Handle, clusterSnapshot clustersnapshot.ClusterSnapshot, autoscalingKubeClients *AutoscalingKubeClients, cloudProvider cloudprovider.CloudProvider, @@ -114,7 +113,7 @@ func NewAutoscalingContext( AutoscalingOptions: options, CloudProvider: cloudProvider, AutoscalingKubeClients: *autoscalingKubeClients, - PredicateChecker: predicateChecker, + FrameworkHandle: fwHandle, ClusterSnapshot: clusterSnapshot, ExpanderStrategy: expanderStrategy, ProcessorCallbacks: processorCallbacks, diff --git a/cluster-autoscaler/core/autoscaler.go b/cluster-autoscaler/core/autoscaler.go index 0e63a3c85011..42e98897733b 100644 --- a/cluster-autoscaler/core/autoscaler.go +++ b/cluster-autoscaler/core/autoscaler.go @@ -33,9 +33,11 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/observers/loopstart" ca_processors "k8s.io/autoscaler/cluster-autoscaler/processors" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/base" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/predicate" "k8s.io/autoscaler/cluster-autoscaler/simulator/drainability/rules" + "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/simulator/options" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" "k8s.io/autoscaler/cluster-autoscaler/utils/backoff" "k8s.io/autoscaler/cluster-autoscaler/utils/errors" "k8s.io/client-go/informers" @@ -49,7 +51,7 @@ type AutoscalerOptions struct { 
InformerFactory informers.SharedInformerFactory AutoscalingKubeClients *context.AutoscalingKubeClients CloudProvider cloudprovider.CloudProvider - PredicateChecker predicatechecker.PredicateChecker + FrameworkHandle *framework.Handle ClusterSnapshot clustersnapshot.ClusterSnapshot ExpanderStrategy expander.Strategy EstimatorBuilder estimator.EstimatorBuilder @@ -86,7 +88,7 @@ func NewAutoscaler(opts AutoscalerOptions, informerFactory informers.SharedInfor } return NewStaticAutoscaler( opts.AutoscalingOptions, - opts.PredicateChecker, + opts.FrameworkHandle, opts.ClusterSnapshot, opts.AutoscalingKubeClients, opts.Processors, @@ -114,8 +116,15 @@ func initializeDefaultOptions(opts *AutoscalerOptions, informerFactory informers if opts.AutoscalingKubeClients == nil { opts.AutoscalingKubeClients = context.NewAutoscalingKubeClients(opts.AutoscalingOptions, opts.KubeClient, opts.InformerFactory) } + if opts.FrameworkHandle == nil { + fwHandle, err := framework.NewHandle(opts.InformerFactory, opts.SchedulerConfig, opts.DynamicResourceAllocationEnabled) + if err != nil { + return err + } + opts.FrameworkHandle = fwHandle + } if opts.ClusterSnapshot == nil { - opts.ClusterSnapshot = clustersnapshot.NewBasicClusterSnapshot() + opts.ClusterSnapshot = predicate.NewPredicateSnapshot(base.NewBasicSnapshotBase(), opts.FrameworkHandle, opts.DynamicResourceAllocationEnabled) } if opts.RemainingPdbTracker == nil { opts.RemainingPdbTracker = pdb.NewBasicRemainingPdbTracker() diff --git a/cluster-autoscaler/core/podlistprocessor/currently_drained_nodes_test.go b/cluster-autoscaler/core/podlistprocessor/currently_drained_nodes_test.go index 0aebcbd4d671..ae41f5127c54 100644 --- a/cluster-autoscaler/core/podlistprocessor/currently_drained_nodes_test.go +++ b/cluster-autoscaler/core/podlistprocessor/currently_drained_nodes_test.go @@ -26,6 +26,7 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/core/scaledown" "k8s.io/autoscaler/cluster-autoscaler/core/scaledown/status" 
"k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/testsnapshot" "k8s.io/autoscaler/cluster-autoscaler/utils/errors" . "k8s.io/autoscaler/cluster-autoscaler/utils/test" ) @@ -194,7 +195,7 @@ func TestCurrentlyDrainedNodesPodListProcessor(t *testing.T) { name: "single node, non-recreatable pods filtered out", drainedNodes: []string{"n"}, nodes: []*apiv1.Node{ - BuildTestNode("n", 1000, 10), + BuildTestNode("n", 2000, 10), }, pods: []*apiv1.Pod{ BuildScheduledTestPod("p1", 100, 1, "n"), @@ -229,11 +230,11 @@ func TestCurrentlyDrainedNodesPodListProcessor(t *testing.T) { name: "everything works together", drainedNodes: []string{"n1", "n3", "n5"}, nodes: []*apiv1.Node{ - BuildTestNode("n1", 1000, 10), - BuildTestNode("n2", 1000, 10), - BuildTestNode("n3", 1000, 10), - BuildTestNode("n4", 1000, 10), - BuildTestNode("n5", 1000, 10), + BuildTestNode("n1", 3000, 10), + BuildTestNode("n2", 3000, 10), + BuildTestNode("n3", 3000, 10), + BuildTestNode("n4", 3000, 10), + BuildTestNode("n5", 3000, 10), }, pods: []*apiv1.Pod{ BuildScheduledTestPod("p1", 100, 1, "n1"), @@ -267,7 +268,7 @@ func TestCurrentlyDrainedNodesPodListProcessor(t *testing.T) { t.Run(tc.name, func(t *testing.T) { ctx := context.AutoscalingContext{ ScaleDownActuator: &mockActuator{&mockActuationStatus{tc.drainedNodes}}, - ClusterSnapshot: clustersnapshot.NewBasicClusterSnapshot(), + ClusterSnapshot: testsnapshot.NewTestSnapshotOrDie(t), } clustersnapshot.InitializeClusterSnapshotOrDie(t, ctx.ClusterSnapshot, tc.nodes, tc.pods) diff --git a/cluster-autoscaler/core/podlistprocessor/filter_out_expendable.go b/cluster-autoscaler/core/podlistprocessor/filter_out_expendable.go index 550f8a10520f..faba2261ba60 100644 --- a/cluster-autoscaler/core/podlistprocessor/filter_out_expendable.go +++ b/cluster-autoscaler/core/podlistprocessor/filter_out_expendable.go @@ -56,6 +56,7 @@ func (p *filterOutExpendable) Process(context 
*context.AutoscalingContext, pods // CA logic from before migration to scheduler framework. So let's keep it for now func (p *filterOutExpendable) addPreemptingPodsToSnapshot(pods []*apiv1.Pod, ctx *context.AutoscalingContext) error { for _, p := range pods { + // TODO(DRA): Figure out if/how to use the predicate-checking SchedulePod() here instead - otherwise this doesn't work with DRA pods. if err := ctx.ClusterSnapshot.ForceAddPod(p, p.Status.NominatedNodeName); err != nil { klog.Errorf("Failed to update snapshot with pod %s/%s waiting for preemption: %v", p.Namespace, p.Name, err) return caerrors.ToAutoscalerError(caerrors.InternalError, err) diff --git a/cluster-autoscaler/core/podlistprocessor/filter_out_expendable_test.go b/cluster-autoscaler/core/podlistprocessor/filter_out_expendable_test.go index 94f6915e3028..1ac006c6d065 100644 --- a/cluster-autoscaler/core/podlistprocessor/filter_out_expendable_test.go +++ b/cluster-autoscaler/core/podlistprocessor/filter_out_expendable_test.go @@ -25,7 +25,8 @@ import ( apiv1 "k8s.io/api/core/v1" "k8s.io/autoscaler/cluster-autoscaler/config" "k8s.io/autoscaler/cluster-autoscaler/context" - "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/testsnapshot" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" "k8s.io/autoscaler/cluster-autoscaler/utils/test" ) @@ -109,8 +110,8 @@ func TestFilterOutExpendable(t *testing.T) { for _, tc := range testCases { t.Run(tc.name, func(t *testing.T) { processor := NewFilterOutExpendablePodListProcessor() - snapshot := clustersnapshot.NewBasicClusterSnapshot() - err := snapshot.SetClusterState(tc.nodes, nil) + snapshot := testsnapshot.NewTestSnapshotOrDie(t) + err := snapshot.SetClusterState(tc.nodes, nil, drasnapshot.Snapshot{}) assert.NoError(t, err) pods, err := 
processor.Process(&context.AutoscalingContext{ diff --git a/cluster-autoscaler/core/podlistprocessor/filter_out_schedulable.go b/cluster-autoscaler/core/podlistprocessor/filter_out_schedulable.go index f56fb19d98c0..3283cdeda2d8 100644 --- a/cluster-autoscaler/core/podlistprocessor/filter_out_schedulable.go +++ b/cluster-autoscaler/core/podlistprocessor/filter_out_schedulable.go @@ -26,7 +26,6 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/metrics" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" "k8s.io/autoscaler/cluster-autoscaler/simulator/scheduling" corev1helpers "k8s.io/component-helpers/scheduling/corev1" klog "k8s.io/klog/v2" @@ -38,9 +37,9 @@ type filterOutSchedulablePodListProcessor struct { } // NewFilterOutSchedulablePodListProcessor creates a PodListProcessor filtering out schedulable pods -func NewFilterOutSchedulablePodListProcessor(predicateChecker predicatechecker.PredicateChecker, nodeFilter func(*framework.NodeInfo) bool) *filterOutSchedulablePodListProcessor { +func NewFilterOutSchedulablePodListProcessor(nodeFilter func(*framework.NodeInfo) bool) *filterOutSchedulablePodListProcessor { return &filterOutSchedulablePodListProcessor{ - schedulingSimulator: scheduling.NewHintingSimulator(predicateChecker), + schedulingSimulator: scheduling.NewHintingSimulator(), nodeFilter: nodeFilter, } } diff --git a/cluster-autoscaler/core/podlistprocessor/filter_out_schedulable_test.go b/cluster-autoscaler/core/podlistprocessor/filter_out_schedulable_test.go index 7b0054f9a2f2..d3f9de91653d 100644 --- a/cluster-autoscaler/core/podlistprocessor/filter_out_schedulable_test.go +++ b/cluster-autoscaler/core/podlistprocessor/filter_out_schedulable_test.go @@ -25,16 +25,15 @@ import ( apiv1 "k8s.io/api/core/v1" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + 
"k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/base" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/testsnapshot" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" "k8s.io/autoscaler/cluster-autoscaler/simulator/scheduling" . "k8s.io/autoscaler/cluster-autoscaler/utils/test" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" ) func TestFilterOutSchedulable(t *testing.T) { - schedulermetrics.Register() - node := buildReadyTestNode("node", 2000, 100) matchesAllNodes := func(*framework.NodeInfo) bool { return true } matchesNoNodes := func(*framework.NodeInfo) bool { return false } @@ -176,9 +175,7 @@ func TestFilterOutSchedulable(t *testing.T) { for tn, tc := range testCases { t.Run(tn, func(t *testing.T) { - clusterSnapshot := clustersnapshot.NewBasicClusterSnapshot() - predicateChecker, err := predicatechecker.NewTestPredicateChecker() - assert.NoError(t, err) + clusterSnapshot := testsnapshot.NewTestSnapshotOrDie(t) var allExpectedScheduledPods []*apiv1.Pod allExpectedScheduledPods = append(allExpectedScheduledPods, tc.expectedScheduledPods...) 
@@ -194,7 +191,7 @@ func TestFilterOutSchedulable(t *testing.T) { clusterSnapshot.Fork() - processor := NewFilterOutSchedulablePodListProcessor(predicateChecker, tc.nodeFilter) + processor := NewFilterOutSchedulablePodListProcessor(tc.nodeFilter) unschedulablePods, err := processor.filterOutSchedulableByPacking(tc.unschedulableCandidates, clusterSnapshot) assert.NoError(t, err) @@ -253,8 +250,12 @@ func BenchmarkFilterOutSchedulable(b *testing.B) { }, } snapshots := map[string]func() clustersnapshot.ClusterSnapshot{ - "basic": func() clustersnapshot.ClusterSnapshot { return clustersnapshot.NewBasicClusterSnapshot() }, - "delta": func() clustersnapshot.ClusterSnapshot { return clustersnapshot.NewDeltaClusterSnapshot() }, + "basic": func() clustersnapshot.ClusterSnapshot { + return testsnapshot.NewCustomTestSnapshotOrDie(b, base.NewBasicSnapshotBase()) + }, + "delta": func() clustersnapshot.ClusterSnapshot { + return testsnapshot.NewCustomTestSnapshotOrDie(b, base.NewDeltaSnapshotBase()) + }, } for snapshotName, snapshotFactory := range snapshots { for _, tc := range tests { @@ -279,18 +280,15 @@ func BenchmarkFilterOutSchedulable(b *testing.B) { } } - predicateChecker, err := predicatechecker.NewTestPredicateChecker() - assert.NoError(b, err) - clusterSnapshot := snapshotFactory() - if err := clusterSnapshot.SetClusterState(nodes, scheduledPods); err != nil { + if err := clusterSnapshot.SetClusterState(nodes, scheduledPods, drasnapshot.Snapshot{}); err != nil { assert.NoError(b, err) } b.ResetTimer() for i := 0; i < b.N; i++ { - processor := NewFilterOutSchedulablePodListProcessor(predicateChecker, scheduling.ScheduleAnywhere) + processor := NewFilterOutSchedulablePodListProcessor(scheduling.ScheduleAnywhere) if stillPending, err := processor.filterOutSchedulableByPacking(pendingPods, clusterSnapshot); err != nil { assert.NoError(b, err) } else if len(stillPending) < tc.pendingPods { diff --git a/cluster-autoscaler/core/podlistprocessor/pod_list_processor.go 
b/cluster-autoscaler/core/podlistprocessor/pod_list_processor.go index 9557b134c2cc..cff1f6587d04 100644 --- a/cluster-autoscaler/core/podlistprocessor/pod_list_processor.go +++ b/cluster-autoscaler/core/podlistprocessor/pod_list_processor.go @@ -19,17 +19,16 @@ package podlistprocessor import ( "k8s.io/autoscaler/cluster-autoscaler/processors/pods" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" ) // NewDefaultPodListProcessor returns a default implementation of the pod list // processor, which wraps and sequentially runs other sub-processors. -func NewDefaultPodListProcessor(predicateChecker predicatechecker.PredicateChecker, nodeFilter func(*framework.NodeInfo) bool) *pods.CombinedPodListProcessor { +func NewDefaultPodListProcessor(nodeFilter func(*framework.NodeInfo) bool) *pods.CombinedPodListProcessor { return pods.NewCombinedPodListProcessor([]pods.PodListProcessor{ NewClearTPURequestsPodListProcessor(), NewFilterOutExpendablePodListProcessor(), NewCurrentlyDrainedNodesPodListProcessor(), - NewFilterOutSchedulablePodListProcessor(predicateChecker, nodeFilter), + NewFilterOutSchedulablePodListProcessor(nodeFilter), NewFilterOutDaemonSetPodListProcessor(), }) } diff --git a/cluster-autoscaler/core/scaledown/actuation/actuator.go b/cluster-autoscaler/core/scaledown/actuation/actuator.go index a85410172684..5b4e2359eb8b 100644 --- a/cluster-autoscaler/core/scaledown/actuation/actuator.go +++ b/cluster-autoscaler/core/scaledown/actuation/actuator.go @@ -33,7 +33,10 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/observers/nodegroupchange" "k8s.io/autoscaler/cluster-autoscaler/simulator" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/base" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/predicate" "k8s.io/autoscaler/cluster-autoscaler/simulator/drainability/rules" + drasnapshot 
"k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/options" "k8s.io/autoscaler/cluster-autoscaler/simulator/utilization" "k8s.io/autoscaler/cluster-autoscaler/utils/errors" @@ -356,7 +359,7 @@ func (a *Actuator) taintNode(node *apiv1.Node) error { } func (a *Actuator) createSnapshot(nodes []*apiv1.Node) (clustersnapshot.ClusterSnapshot, error) { - snapshot := clustersnapshot.NewBasicClusterSnapshot() + snapshot := predicate.NewPredicateSnapshot(base.NewBasicSnapshotBase(), a.ctx.FrameworkHandle, a.ctx.DynamicResourceAllocationEnabled) pods, err := a.ctx.AllPodLister().List() if err != nil { return nil, err @@ -365,7 +368,7 @@ func (a *Actuator) createSnapshot(nodes []*apiv1.Node) (clustersnapshot.ClusterS scheduledPods := kube_util.ScheduledPods(pods) nonExpendableScheduledPods := utils.FilterOutExpendablePods(scheduledPods, a.ctx.ExpendablePodsPriorityCutoff) - err = snapshot.SetClusterState(nodes, nonExpendableScheduledPods) + err = snapshot.SetClusterState(nodes, nonExpendableScheduledPods, drasnapshot.Snapshot{}) if err != nil { return nil, err } diff --git a/cluster-autoscaler/core/scaledown/actuation/actuator_test.go b/cluster-autoscaler/core/scaledown/actuation/actuator_test.go index 6f44abaf06b6..9a278f4f6eb0 100644 --- a/cluster-autoscaler/core/scaledown/actuation/actuator_test.go +++ b/cluster-autoscaler/core/scaledown/actuation/actuator_test.go @@ -24,6 +24,7 @@ import ( "github.com/google/go-cmp/cmp" "github.com/google/go-cmp/cmp/cmpopts" + appsv1 "k8s.io/api/apps/v1" apiv1 "k8s.io/api/core/v1" policyv1 "k8s.io/api/policy/v1" @@ -50,7 +51,6 @@ import ( . 
"k8s.io/autoscaler/cluster-autoscaler/utils/test" "k8s.io/client-go/kubernetes/fake" core "k8s.io/client-go/testing" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" ) type nodeGroupViewInfo struct { @@ -1000,8 +1000,6 @@ func getStartDeletionTestCases(ignoreDaemonSetsUtilization bool, suffix string) } func TestStartDeletion(t *testing.T) { - schedulermetrics.Register() - testSets := []map[string]startDeletionTestCase{ // IgnoreDaemonSetsUtilization is false getStartDeletionTestCases(false, "testNg1"), diff --git a/cluster-autoscaler/core/scaledown/actuation/drain_test.go b/cluster-autoscaler/core/scaledown/actuation/drain_test.go index 6ba905761db5..962a707990dc 100644 --- a/cluster-autoscaler/core/scaledown/actuation/drain_test.go +++ b/cluster-autoscaler/core/scaledown/actuation/drain_test.go @@ -26,6 +26,7 @@ import ( "github.com/google/go-cmp/cmp" "github.com/google/go-cmp/cmp/cmpopts" "github.com/stretchr/testify/assert" + apiv1 "k8s.io/api/core/v1" policyv1beta1 "k8s.io/api/policy/v1beta1" "k8s.io/apimachinery/pkg/api/errors" @@ -37,6 +38,7 @@ import ( . 
"k8s.io/autoscaler/cluster-autoscaler/core/test" "k8s.io/autoscaler/cluster-autoscaler/core/utils" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/testsnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/utils/daemonset" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" @@ -611,7 +613,7 @@ func TestPodsToEvict(t *testing.T) { }, } { t.Run(tn, func(t *testing.T) { - snapshot := clustersnapshot.NewBasicClusterSnapshot() + snapshot := testsnapshot.NewTestSnapshotOrDie(t) node := BuildTestNode("test-node", 1000, 1000) err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node, tc.pods...)) if err != nil { diff --git a/cluster-autoscaler/core/scaledown/eligibility/eligibility.go b/cluster-autoscaler/core/scaledown/eligibility/eligibility.go index faa2b6d6d3ef..81c8044e3af9 100644 --- a/cluster-autoscaler/core/scaledown/eligibility/eligibility.go +++ b/cluster-autoscaler/core/scaledown/eligibility/eligibility.go @@ -31,7 +31,7 @@ import ( apiv1 "k8s.io/api/core/v1" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" - klog "k8s.io/klog/v2" + "k8s.io/klog/v2" ) const ( diff --git a/cluster-autoscaler/core/scaledown/eligibility/eligibility_test.go b/cluster-autoscaler/core/scaledown/eligibility/eligibility_test.go index 23397ab4327e..b585d5951517 100644 --- a/cluster-autoscaler/core/scaledown/eligibility/eligibility_test.go +++ b/cluster-autoscaler/core/scaledown/eligibility/eligibility_test.go @@ -21,6 +21,9 @@ import ( "testing" "time" + "github.com/stretchr/testify/assert" + + apiv1 "k8s.io/api/core/v1" testprovider "k8s.io/autoscaler/cluster-autoscaler/cloudprovider/test" "k8s.io/autoscaler/cluster-autoscaler/config" "k8s.io/autoscaler/cluster-autoscaler/core/scaledown/unremovable" @@ -29,10 +32,6 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" 
"k8s.io/autoscaler/cluster-autoscaler/utils/taints" . "k8s.io/autoscaler/cluster-autoscaler/utils/test" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" - - "github.com/stretchr/testify/assert" - apiv1 "k8s.io/api/core/v1" "k8s.io/client-go/kubernetes/fake" ) @@ -149,8 +148,6 @@ func getTestCases(ignoreDaemonSetsUtilization bool, suffix string, now time.Time } func TestFilterOutUnremovable(t *testing.T) { - schedulermetrics.Register() - now := time.Now() for _, tc := range append(getTestCases(false, "IgnoreDaemonSetUtilization=false", now), getTestCases(true, "IgnoreDaemonsetUtilization=true", now)...) { diff --git a/cluster-autoscaler/core/scaledown/planner/planner.go b/cluster-autoscaler/core/scaledown/planner/planner.go index 2898e240cb05..32be506ca7ab 100644 --- a/cluster-autoscaler/core/scaledown/planner/planner.go +++ b/cluster-autoscaler/core/scaledown/planner/planner.go @@ -89,8 +89,8 @@ func New(context *context.AutoscalingContext, processors *processors.Autoscaling context: context, unremovableNodes: unremovable.NewNodes(), unneededNodes: unneeded.NewNodes(processors.NodeGroupConfigProcessor, resourceLimitsFinder), - rs: simulator.NewRemovalSimulator(context.ListerRegistry, context.ClusterSnapshot, context.PredicateChecker, deleteOptions, drainabilityRules, true), - actuationInjector: scheduling.NewHintingSimulator(context.PredicateChecker), + rs: simulator.NewRemovalSimulator(context.ListerRegistry, context.ClusterSnapshot, deleteOptions, drainabilityRules, true), + actuationInjector: scheduling.NewHintingSimulator(), eligibilityChecker: eligibility.NewChecker(processors.NodeGroupConfigProcessor), nodeUtilizationMap: make(map[string]utilization.Info), resourceLimitsFinder: resourceLimitsFinder, diff --git a/cluster-autoscaler/core/scaledown/planner/planner_test.go b/cluster-autoscaler/core/scaledown/planner/planner_test.go index 0aa4881a9613..fc3fe854be23 100644 --- a/cluster-autoscaler/core/scaledown/planner/planner_test.go +++ 
b/cluster-autoscaler/core/scaledown/planner/planner_test.go @@ -22,6 +22,7 @@ import ( "time" "github.com/stretchr/testify/assert" + appsv1 "k8s.io/api/apps/v1" apiv1 "k8s.io/api/core/v1" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" @@ -44,12 +45,9 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/utils/taints" . "k8s.io/autoscaler/cluster-autoscaler/utils/test" "k8s.io/client-go/kubernetes/fake" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" ) func TestUpdateClusterState(t *testing.T) { - schedulermetrics.Register() - testCases := []struct { name string nodes []*apiv1.Node diff --git a/cluster-autoscaler/core/scaledown/unneeded/nodes_test.go b/cluster-autoscaler/core/scaledown/unneeded/nodes_test.go index 51048eb57df5..05f450150fe3 100644 --- a/cluster-autoscaler/core/scaledown/unneeded/nodes_test.go +++ b/cluster-autoscaler/core/scaledown/unneeded/nodes_test.go @@ -21,6 +21,8 @@ import ( "testing" "time" + "github.com/stretchr/testify/assert" + apiv1 "k8s.io/api/core/v1" "k8s.io/autoscaler/cluster-autoscaler/cloudprovider" testprovider "k8s.io/autoscaler/cluster-autoscaler/cloudprovider/test" @@ -33,9 +35,6 @@ import ( kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" . 
"k8s.io/autoscaler/cluster-autoscaler/utils/test" "k8s.io/client-go/kubernetes/fake" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" - - "github.com/stretchr/testify/assert" ) func TestUpdate(t *testing.T) { @@ -129,8 +128,6 @@ func version(n simulator.NodeToBeRemoved) string { } func TestRemovableAt(t *testing.T) { - schedulermetrics.Register() - testCases := []struct { name string numEmpty int diff --git a/cluster-autoscaler/core/scaleup/orchestrator/async_initializer.go b/cluster-autoscaler/core/scaleup/orchestrator/async_initializer.go index de2dabf600bc..a8e82b87e7ba 100644 --- a/cluster-autoscaler/core/scaleup/orchestrator/async_initializer.go +++ b/cluster-autoscaler/core/scaleup/orchestrator/async_initializer.go @@ -25,10 +25,10 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/cloudprovider" "k8s.io/autoscaler/cluster-autoscaler/context" - "k8s.io/autoscaler/cluster-autoscaler/core/utils" "k8s.io/autoscaler/cluster-autoscaler/processors/nodegroups" "k8s.io/autoscaler/cluster-autoscaler/processors/nodegroupset" "k8s.io/autoscaler/cluster-autoscaler/processors/status" + "k8s.io/autoscaler/cluster-autoscaler/simulator" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/utils/errors" "k8s.io/autoscaler/cluster-autoscaler/utils/taints" @@ -110,7 +110,7 @@ func (s *AsyncNodeGroupInitializer) InitializeNodeGroup(result nodegroups.AsyncN mainCreatedNodeGroup := result.CreationResult.MainCreatedNodeGroup // If possible replace candidate node-info with node info based on crated node group. The latter // one should be more in line with nodes which will be created by node group. - nodeInfo, aErr := utils.GetNodeInfoFromTemplate(mainCreatedNodeGroup, s.daemonSets, s.taintConfig) + nodeInfo, aErr := simulator.TemplateNodeInfoFromNodeGroupTemplate(mainCreatedNodeGroup, s.daemonSets, s.taintConfig) if aErr != nil { klog.Warningf("Cannot build node info for newly created main node group %s. Using fallback. 
Error: %v", mainCreatedNodeGroup.Id(), aErr) nodeInfo = s.nodeInfo diff --git a/cluster-autoscaler/core/scaleup/orchestrator/orchestrator.go b/cluster-autoscaler/core/scaleup/orchestrator/orchestrator.go index 8eb316c594b2..73161a658e7f 100644 --- a/cluster-autoscaler/core/scaleup/orchestrator/orchestrator.go +++ b/cluster-autoscaler/core/scaleup/orchestrator/orchestrator.go @@ -27,7 +27,6 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/context" "k8s.io/autoscaler/cluster-autoscaler/core/scaleup/equivalence" "k8s.io/autoscaler/cluster-autoscaler/core/scaleup/resource" - "k8s.io/autoscaler/cluster-autoscaler/core/utils" "k8s.io/autoscaler/cluster-autoscaler/estimator" "k8s.io/autoscaler/cluster-autoscaler/expander" "k8s.io/autoscaler/cluster-autoscaler/metrics" @@ -35,6 +34,7 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/processors/nodegroups" "k8s.io/autoscaler/cluster-autoscaler/processors/nodegroupset" "k8s.io/autoscaler/cluster-autoscaler/processors/status" + "k8s.io/autoscaler/cluster-autoscaler/simulator" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/utils/errors" "k8s.io/autoscaler/cluster-autoscaler/utils/klogx" @@ -465,7 +465,6 @@ func (o *ScaleUpOrchestrator) ComputeExpansionOption( estimateStart := time.Now() expansionEstimator := o.estimatorBuilder( - o.autoscalingContext.PredicateChecker, o.autoscalingContext.ClusterSnapshot, estimator.NewEstimationContext(o.autoscalingContext.MaxNodesTotal, option.SimilarNodeGroups, currentNodeCount), ) @@ -527,7 +526,7 @@ func (o *ScaleUpOrchestrator) CreateNodeGroup( // If possible replace candidate node-info with node info based on crated node group. The latter // one should be more in line with nodes which will be created by node group. 
- mainCreatedNodeInfo, aErr := utils.GetNodeInfoFromTemplate(createNodeGroupResult.MainCreatedNodeGroup, daemonSets, o.taintConfig) + mainCreatedNodeInfo, aErr := simulator.TemplateNodeInfoFromNodeGroupTemplate(createNodeGroupResult.MainCreatedNodeGroup, daemonSets, o.taintConfig) if aErr == nil { nodeInfos[createNodeGroupResult.MainCreatedNodeGroup.Id()] = mainCreatedNodeInfo schedulablePodGroups[createNodeGroupResult.MainCreatedNodeGroup.Id()] = o.SchedulablePodGroups(podEquivalenceGroups, createNodeGroupResult.MainCreatedNodeGroup, mainCreatedNodeInfo) @@ -542,7 +541,7 @@ func (o *ScaleUpOrchestrator) CreateNodeGroup( delete(schedulablePodGroups, oldId) } for _, nodeGroup := range createNodeGroupResult.ExtraCreatedNodeGroups { - nodeInfo, aErr := utils.GetNodeInfoFromTemplate(nodeGroup, daemonSets, o.taintConfig) + nodeInfo, aErr := simulator.TemplateNodeInfoFromNodeGroupTemplate(nodeGroup, daemonSets, o.taintConfig) if aErr != nil { klog.Warningf("Cannot build node info for newly created extra node group %v; balancing similar node groups will not work; err=%v", nodeGroup.Id(), aErr) continue @@ -577,7 +576,7 @@ func (o *ScaleUpOrchestrator) SchedulablePodGroups( var schedulablePodGroups []estimator.PodEquivalenceGroup for _, eg := range podEquivalenceGroups { samplePod := eg.Pods[0] - if err := o.autoscalingContext.PredicateChecker.CheckPredicates(o.autoscalingContext.ClusterSnapshot, samplePod, nodeInfo.Node().Name); err == nil { + if err := o.autoscalingContext.ClusterSnapshot.CheckPredicates(samplePod, nodeInfo.Node().Name); err == nil { // Add pods to option. 
schedulablePodGroups = append(schedulablePodGroups, estimator.PodEquivalenceGroup{ Pods: eg.Pods, @@ -586,7 +585,7 @@ func (o *ScaleUpOrchestrator) SchedulablePodGroups( eg.Schedulable = true eg.SchedulableGroups = append(eg.SchedulableGroups, nodeGroup.Id()) } else { - klog.V(2).Infof("Pod %s/%s can't be scheduled on %s, predicate checking error: %v", samplePod.Namespace, samplePod.Name, nodeGroup.Id(), err.VerboseMessage()) + klog.V(2).Infof("Pod %s/%s can't be scheduled on %s, predicate checking error: %v", samplePod.Namespace, samplePod.Name, nodeGroup.Id(), err) if podCount := len(eg.Pods); podCount > 1 { klog.V(2).Infof("%d other pods similar to %s can't be scheduled on %s", podCount-1, samplePod.Name, nodeGroup.Id()) } diff --git a/cluster-autoscaler/core/scaleup/orchestrator/orchestrator_test.go b/cluster-autoscaler/core/scaleup/orchestrator/orchestrator_test.go index a1cdd15eba91..e23fd8c05bdf 100644 --- a/cluster-autoscaler/core/scaleup/orchestrator/orchestrator_test.go +++ b/cluster-autoscaler/core/scaleup/orchestrator/orchestrator_test.go @@ -26,13 +26,9 @@ import ( "testing" "time" - "k8s.io/autoscaler/cluster-autoscaler/processors/nodegroupconfig" - "k8s.io/autoscaler/cluster-autoscaler/processors/nodegroups/asyncnodegroups" - "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - kube_record "k8s.io/client-go/tools/record" - "k8s.io/component-base/metrics/legacyregistry" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" - + appsv1 "k8s.io/api/apps/v1" + apiv1 "k8s.io/api/core/v1" + v1 "k8s.io/api/core/v1" "k8s.io/autoscaler/cluster-autoscaler/cloudprovider" testprovider "k8s.io/autoscaler/cluster-autoscaler/cloudprovider/test" "k8s.io/autoscaler/cluster-autoscaler/clusterstate" @@ -44,20 +40,22 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/estimator" "k8s.io/autoscaler/cluster-autoscaler/metrics" "k8s.io/autoscaler/cluster-autoscaler/processors" + "k8s.io/autoscaler/cluster-autoscaler/processors/nodegroupconfig" + 
"k8s.io/autoscaler/cluster-autoscaler/processors/nodegroups/asyncnodegroups" "k8s.io/autoscaler/cluster-autoscaler/processors/nodegroupset" "k8s.io/autoscaler/cluster-autoscaler/processors/nodeinfosprovider" "k8s.io/autoscaler/cluster-autoscaler/processors/status" processorstest "k8s.io/autoscaler/cluster-autoscaler/processors/test" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/utils/errors" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" "k8s.io/autoscaler/cluster-autoscaler/utils/taints" . "k8s.io/autoscaler/cluster-autoscaler/utils/test" "k8s.io/autoscaler/cluster-autoscaler/utils/units" - - appsv1 "k8s.io/api/apps/v1" - apiv1 "k8s.io/api/core/v1" - v1 "k8s.io/api/core/v1" "k8s.io/client-go/kubernetes/fake" + kube_record "k8s.io/client-go/tools/record" + "k8s.io/component-base/metrics/legacyregistry" "github.com/stretchr/testify/assert" ) @@ -72,8 +70,6 @@ var defaultOptions = config.AutoscalingOptions{ // Scale up scenarios. func TestScaleUpOK(t *testing.T) { - schedulermetrics.Register() - config := &ScaleUpTestConfig{ Nodes: []NodeConfig{ {Name: "n1", Cpu: 100, Memory: 100, Gpu: 0, Ready: true, Group: "ng1"}, @@ -1049,6 +1045,8 @@ func runSimpleScaleUpTest(t *testing.T, config *ScaleUpTestConfig) *ScaleUpTestR // build orchestrator context, err := NewScaleTestAutoscalingContext(options, &fake.Clientset{}, listers, provider, nil, nil) assert.NoError(t, err) + err = context.ClusterSnapshot.SetClusterState(nodes, kube_util.ScheduledPods(pods), drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, err := nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false). 
Process(&context, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) assert.NoError(t, err) @@ -1130,13 +1128,15 @@ func TestScaleUpUnhealthy(t *testing.T) { SetNodeReadyState(n1, true, someTimeAgo) n2 := BuildTestNode("n2", 1000, 1000) SetNodeReadyState(n2, true, someTimeAgo) + nodes := []*apiv1.Node{n1, n2} p1 := BuildTestPod("p1", 80, 0) p2 := BuildTestPod("p2", 800, 0) p1.Spec.NodeName = "n1" p2.Spec.NodeName = "n2" + pods := []*apiv1.Pod{p1, p2} - podLister := kube_util.NewTestPodLister([]*apiv1.Pod{p1, p2}) + podLister := kube_util.NewTestPodLister(pods) listers := kube_util.NewListerRegistry(nil, nil, podLister, nil, nil, nil, nil, nil, nil) provider := testprovider.NewTestCloudProvider(func(nodeGroup string, increase int) error { @@ -1155,8 +1155,8 @@ func TestScaleUpUnhealthy(t *testing.T) { } context, err := NewScaleTestAutoscalingContext(options, &fake.Clientset{}, listers, provider, nil, nil) assert.NoError(t, err) - - nodes := []*apiv1.Node{n1, n2} + err = context.ClusterSnapshot.SetClusterState(nodes, pods, drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, _ := nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false).Process(&context, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) clusterState := clusterstate.NewClusterStateRegistry(provider, clusterstate.ClusterStateRegistryConfig{}, context.LogRecorder, NewBackoff(), nodegroupconfig.NewDefaultNodeGroupConfigProcessor(config.NodeGroupAutoscalingOptions{MaxNodeProvisionTime: 15 * time.Minute}), asyncnodegroups.NewDefaultAsyncNodeGroupStateChecker()) clusterState.UpdateNodes(nodes, nodeInfos, time.Now()) @@ -1198,7 +1198,8 @@ func TestBinpackingLimiter(t *testing.T) { context, err := NewScaleTestAutoscalingContext(options, &fake.Clientset{}, listers, provider, nil, nil) assert.NoError(t, err) - + err = context.ClusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, err := 
nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false). Process(&context, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) assert.NoError(t, err) @@ -1233,11 +1234,13 @@ func TestScaleUpNoHelp(t *testing.T) { n1 := BuildTestNode("n1", 100, 1000) now := time.Now() SetNodeReadyState(n1, true, now.Add(-2*time.Minute)) + nodes := []*apiv1.Node{n1} p1 := BuildTestPod("p1", 80, 0) p1.Spec.NodeName = "n1" + pods := []*apiv1.Pod{p1} - podLister := kube_util.NewTestPodLister([]*apiv1.Pod{p1}) + podLister := kube_util.NewTestPodLister(pods) listers := kube_util.NewListerRegistry(nil, nil, podLister, nil, nil, nil, nil, nil, nil) provider := testprovider.NewTestCloudProvider(func(nodeGroup string, increase int) error { @@ -1255,8 +1258,8 @@ func TestScaleUpNoHelp(t *testing.T) { } context, err := NewScaleTestAutoscalingContext(options, &fake.Clientset{}, listers, provider, nil, nil) assert.NoError(t, err) - - nodes := []*apiv1.Node{n1} + err = context.ClusterSnapshot.SetClusterState(nodes, pods, drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, _ := nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false).Process(&context, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) clusterState := clusterstate.NewClusterStateRegistry(provider, clusterstate.ClusterStateRegistryConfig{}, context.LogRecorder, NewBackoff(), nodegroupconfig.NewDefaultNodeGroupConfigProcessor(config.NodeGroupAutoscalingOptions{MaxNodeProvisionTime: 15 * time.Minute}), asyncnodegroups.NewDefaultAsyncNodeGroupStateChecker()) clusterState.UpdateNodes(nodes, nodeInfos, time.Now()) @@ -1410,7 +1413,8 @@ func TestComputeSimilarNodeGroups(t *testing.T) { listers := kube_util.NewListerRegistry(nil, nil, kube_util.NewTestPodLister(nil), nil, nil, nil, nil, nil, nil) ctx, err := NewScaleTestAutoscalingContext(config.AutoscalingOptions{BalanceSimilarNodeGroups: tc.balancingEnabled}, &fake.Clientset{}, listers, provider, nil, nil) assert.NoError(t, err) - + err = 
ctx.ClusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, _ := nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false).Process(&ctx, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) clusterState := clusterstate.NewClusterStateRegistry(provider, clusterstate.ClusterStateRegistryConfig{}, ctx.LogRecorder, NewBackoff(), nodegroupconfig.NewDefaultNodeGroupConfigProcessor(config.NodeGroupAutoscalingOptions{MaxNodeProvisionTime: 15 * time.Minute}), asyncnodegroups.NewDefaultAsyncNodeGroupStateChecker()) assert.NoError(t, clusterState.UpdateNodes(nodes, nodeInfos, time.Now())) @@ -1474,7 +1478,8 @@ func TestScaleUpBalanceGroups(t *testing.T) { } context, err := NewScaleTestAutoscalingContext(options, &fake.Clientset{}, listers, provider, nil, nil) assert.NoError(t, err) - + err = context.ClusterSnapshot.SetClusterState(nodes, podList, drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, _ := nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false).Process(&context, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) clusterState := clusterstate.NewClusterStateRegistry(provider, clusterstate.ClusterStateRegistryConfig{}, context.LogRecorder, NewBackoff(), nodegroupconfig.NewDefaultNodeGroupConfigProcessor(config.NodeGroupAutoscalingOptions{MaxNodeProvisionTime: 15 * time.Minute}), asyncnodegroups.NewDefaultAsyncNodeGroupStateChecker()) clusterState.UpdateNodes(nodes, nodeInfos, time.Now()) @@ -1650,6 +1655,8 @@ func TestScaleUpToMeetNodeGroupMinSize(t *testing.T) { assert.NoError(t, err) nodes := []*apiv1.Node{n1, n2} + err = context.ClusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, _ := nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false).Process(&context, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, time.Now()) processors := processorstest.NewTestProcessors(&context) clusterState := 
clusterstate.NewClusterStateRegistry(provider, clusterstate.ClusterStateRegistryConfig{}, context.LogRecorder, NewBackoff(), nodegroupconfig.NewDefaultNodeGroupConfigProcessor(config.NodeGroupAutoscalingOptions{MaxNodeProvisionTime: 15 * time.Minute}), asyncnodegroups.NewDefaultAsyncNodeGroupStateChecker()) diff --git a/cluster-autoscaler/core/scaleup/resource/manager_test.go b/cluster-autoscaler/core/scaleup/resource/manager_test.go index ac1204be1b55..8ed7b580118e 100644 --- a/cluster-autoscaler/core/scaleup/resource/manager_test.go +++ b/cluster-autoscaler/core/scaleup/resource/manager_test.go @@ -22,6 +22,7 @@ import ( "time" "github.com/stretchr/testify/assert" + appsv1 "k8s.io/api/apps/v1" corev1 "k8s.io/api/core/v1" "k8s.io/autoscaler/cluster-autoscaler/cloudprovider" @@ -31,11 +32,11 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/core/test" "k8s.io/autoscaler/cluster-autoscaler/processors/nodeinfosprovider" processorstest "k8s.io/autoscaler/cluster-autoscaler/processors/test" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" "k8s.io/autoscaler/cluster-autoscaler/utils/taints" utils_test "k8s.io/autoscaler/cluster-autoscaler/utils/test" "k8s.io/client-go/kubernetes/fake" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" ) type nodeGroupConfig struct { @@ -53,8 +54,6 @@ type deltaForNodeTestCase struct { } func TestDeltaForNode(t *testing.T) { - schedulermetrics.Register() - testCases := []deltaForNodeTestCase{ { nodeGroupConfig: nodeGroupConfig{Name: "ng1", Min: 3, Max: 10, Size: 5, CPU: 8, Mem: 16}, @@ -73,6 +72,8 @@ func TestDeltaForNode(t *testing.T) { ng := testCase.nodeGroupConfig group, nodes := newNodeGroup(t, cp, ng.Name, ng.Min, ng.Max, ng.Size, ng.CPU, ng.Mem) + err := ctx.ClusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, _ := 
nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false).Process(&ctx, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, time.Now()) rm := NewManager(processors.CustomResourcesProcessor) @@ -114,6 +115,8 @@ func TestResourcesLeft(t *testing.T) { ng := testCase.nodeGroupConfig _, nodes := newNodeGroup(t, cp, ng.Name, ng.Min, ng.Max, ng.Size, ng.CPU, ng.Mem) + err := ctx.ClusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, _ := nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false).Process(&ctx, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, time.Now()) rm := NewManager(processors.CustomResourcesProcessor) @@ -165,6 +168,8 @@ func TestApplyLimits(t *testing.T) { ng := testCase.nodeGroupConfig group, nodes := newNodeGroup(t, cp, ng.Name, ng.Min, ng.Max, ng.Size, ng.CPU, ng.Mem) + err := ctx.ClusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, _ := nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false).Process(&ctx, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, time.Now()) rm := NewManager(processors.CustomResourcesProcessor) @@ -230,6 +235,8 @@ func TestResourceManagerWithGpuResource(t *testing.T) { assert.NoError(t, err) nodes := []*corev1.Node{n1} + err = context.ClusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) + assert.NoError(t, err) nodeInfos, _ := nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nil, false).Process(&context, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, time.Now()) rm := NewManager(processors.CustomResourcesProcessor) diff --git a/cluster-autoscaler/core/static_autoscaler.go b/cluster-autoscaler/core/static_autoscaler.go index 6902b13df35c..88e40e448336 100644 --- a/cluster-autoscaler/core/static_autoscaler.go +++ b/cluster-autoscaler/core/static_autoscaler.go @@ -46,13 +46,12 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/simulator" 
"k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/drainability/rules" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/simulator/options" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" "k8s.io/autoscaler/cluster-autoscaler/utils/backoff" caerrors "k8s.io/autoscaler/cluster-autoscaler/utils/errors" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" - scheduler_utils "k8s.io/autoscaler/cluster-autoscaler/utils/scheduler" "k8s.io/autoscaler/cluster-autoscaler/utils/taints" "k8s.io/utils/integer" @@ -132,7 +131,7 @@ func (callbacks *staticAutoscalerProcessorCallbacks) reset() { // NewStaticAutoscaler creates an instance of Autoscaler filled with provided parameters func NewStaticAutoscaler( opts config.AutoscalingOptions, - predicateChecker predicatechecker.PredicateChecker, + fwHandle *framework.Handle, clusterSnapshot clustersnapshot.ClusterSnapshot, autoscalingKubeClients *context.AutoscalingKubeClients, processors *ca_processors.AutoscalingProcessors, @@ -155,7 +154,7 @@ func NewStaticAutoscaler( processorCallbacks := newStaticAutoscalerProcessorCallbacks() autoscalingContext := context.NewAutoscalingContext( opts, - predicateChecker, + fwHandle, clusterSnapshot, autoscalingKubeClients, cloudProvider, @@ -339,7 +338,7 @@ func (a *StaticAutoscaler) RunOnce(currentTime time.Time) caerrors.AutoscalerErr } nonExpendableScheduledPods := core_utils.FilterOutExpendablePods(originalScheduledPods, a.ExpendablePodsPriorityCutoff) // Initialize cluster state to ClusterSnapshot - if err := a.ClusterSnapshot.SetClusterState(allNodes, nonExpendableScheduledPods); err != nil { + if err := a.ClusterSnapshot.SetClusterState(allNodes, nonExpendableScheduledPods, drasnapshot.Snapshot{}); err != nil { return 
caerrors.ToAutoscalerError(caerrors.InternalError, err).AddPrefix("failed to initialize ClusterSnapshot: ") } // Initialize Pod Disruption Budget tracking @@ -1028,7 +1027,7 @@ func getUpcomingNodeInfos(upcomingCounts map[string]int, nodeInfos map[string]*f // Ensure new nodes have different names because nodeName // will be used as a map key. Also deep copy pods (daemonsets & // any pods added by cloud provider on template). - nodes = append(nodes, scheduler_utils.DeepCopyTemplateNode(nodeTemplate, fmt.Sprintf("upcoming-%d", i))) + nodes = append(nodes, simulator.FreshNodeInfoFromTemplateNodeInfo(nodeTemplate, fmt.Sprintf("upcoming-%d", i))) } upcomingNodes[nodeGroup] = nodes } diff --git a/cluster-autoscaler/core/static_autoscaler_test.go b/cluster-autoscaler/core/static_autoscaler_test.go index 2df10d4b7355..ec0b084a752b 100644 --- a/cluster-autoscaler/core/static_autoscaler_test.go +++ b/cluster-autoscaler/core/static_autoscaler_test.go @@ -27,6 +27,16 @@ import ( "testing" "time" + "github.com/google/go-cmp/cmp" + "github.com/google/go-cmp/cmp/cmpopts" + "github.com/stretchr/testify/assert" + "github.com/stretchr/testify/mock" + + appsv1 "k8s.io/api/apps/v1" + apiv1 "k8s.io/api/core/v1" + policyv1 "k8s.io/api/policy/v1" + metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" + "k8s.io/apimachinery/pkg/labels" "k8s.io/autoscaler/cluster-autoscaler/cloudprovider" mockprovider "k8s.io/autoscaler/cluster-autoscaler/cloudprovider/mocks" testprovider "k8s.io/autoscaler/cluster-autoscaler/cloudprovider/test" @@ -63,22 +73,10 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/utils/scheduler" "k8s.io/autoscaler/cluster-autoscaler/utils/taints" . 
"k8s.io/autoscaler/cluster-autoscaler/utils/test" - kube_record "k8s.io/client-go/tools/record" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" - - appsv1 "k8s.io/api/apps/v1" - apiv1 "k8s.io/api/core/v1" - policyv1 "k8s.io/api/policy/v1" - metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" - "k8s.io/apimachinery/pkg/labels" "k8s.io/client-go/kubernetes/fake" v1appslister "k8s.io/client-go/listers/apps/v1" - - "github.com/google/go-cmp/cmp" - "github.com/google/go-cmp/cmp/cmpopts" - "github.com/stretchr/testify/assert" - "github.com/stretchr/testify/mock" - klog "k8s.io/klog/v2" + kube_record "k8s.io/client-go/tools/record" + "k8s.io/klog/v2" ) type podListerMock struct { @@ -313,8 +311,6 @@ func setupAutoscaler(config *autoscalerSetupConfig) (*StaticAutoscaler, error) { // TODO: Refactor tests to use setupAutoscaler func TestStaticAutoscalerRunOnce(t *testing.T) { - schedulermetrics.Register() - readyNodeLister := kubernetes.NewTestNodeLister(nil) allNodeLister := kubernetes.NewTestNodeLister(nil) allPodListerMock := &podListerMock{} @@ -406,7 +402,7 @@ func TestStaticAutoscalerRunOnce(t *testing.T) { // MaxNodesTotal reached. readyNodeLister.SetNodes([]*apiv1.Node{n1}) allNodeLister.SetNodes([]*apiv1.Node{n1}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() @@ -417,7 +413,7 @@ func TestStaticAutoscalerRunOnce(t *testing.T) { // Scale up. 
readyNodeLister.SetNodes([]*apiv1.Node{n1}) allNodeLister.SetNodes([]*apiv1.Node{n1}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() onScaleUpMock.On("ScaleUp", "ng1", 1).Return(nil).Once() @@ -431,7 +427,7 @@ func TestStaticAutoscalerRunOnce(t *testing.T) { // Mark unneeded nodes. readyNodeLister.SetNodes([]*apiv1.Node{n1, n2}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() @@ -446,7 +442,7 @@ func TestStaticAutoscalerRunOnce(t *testing.T) { // Scale down. readyNodeLister.SetNodes([]*apiv1.Node{n1, n2}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Times(3) + allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Twice() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() onScaleDownMock.On("ScaleDown", "ng1", "n2").Return(nil).Once() @@ -460,7 +456,7 @@ func TestStaticAutoscalerRunOnce(t *testing.T) { // Mark unregistered nodes. 
readyNodeLister.SetNodes([]*apiv1.Node{n1, n2}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() @@ -475,7 +471,7 @@ func TestStaticAutoscalerRunOnce(t *testing.T) { // Remove unregistered nodes. readyNodeLister.SetNodes([]*apiv1.Node{n1, n2}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() onScaleDownMock.On("ScaleDown", "ng2", "n3").Return(nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() @@ -489,7 +485,7 @@ func TestStaticAutoscalerRunOnce(t *testing.T) { // Scale up to node group min size. readyNodeLister.SetNodes([]*apiv1.Node{n4}) allNodeLister.SetNodes([]*apiv1.Node{n4}) - allPodListerMock.On("List").Return([]*apiv1.Pod{}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil) podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil) onScaleUpMock.On("ScaleUp", "ng3", 2).Return(nil).Once() // 2 new nodes are supposed to be scaled up. @@ -689,7 +685,7 @@ func TestStaticAutoscalerRunOnceWithScaleDownDelayPerNG(t *testing.T) { // Mark unneeded nodes. 
readyNodeLister.SetNodes([]*apiv1.Node{n1, n2}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() @@ -701,7 +697,7 @@ func TestStaticAutoscalerRunOnceWithScaleDownDelayPerNG(t *testing.T) { // Scale down nodegroup readyNodeLister.SetNodes([]*apiv1.Node{n1, n2}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Times(3) + allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Twice() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil) onScaleDownMock.On("ScaleDown", tc.expectedScaleDownNG, tc.expectedScaleDownNode).Return(nil).Once() @@ -828,7 +824,7 @@ func TestStaticAutoscalerRunOnceWithAutoprovisionedEnabled(t *testing.T) { // Scale up. readyNodeLister.SetNodes([]*apiv1.Node{n1}) allNodeLister.SetNodes([]*apiv1.Node{n1}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() onNodeGroupCreateMock.On("Create", "autoprovisioned-TN2").Return(nil).Once() @@ -845,7 +841,7 @@ func TestStaticAutoscalerRunOnceWithAutoprovisionedEnabled(t *testing.T) { // Remove autoprovisioned node group and mark unneeded nodes. 
readyNodeLister.SetNodes([]*apiv1.Node{n1, n2}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() onNodeGroupDeleteMock.On("Delete", "autoprovisioned-TN1").Return(nil).Once() @@ -861,7 +857,7 @@ func TestStaticAutoscalerRunOnceWithAutoprovisionedEnabled(t *testing.T) { // Scale down. readyNodeLister.SetNodes([]*apiv1.Node{n1, n2}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Times(3) + allPodListerMock.On("List").Return([]*apiv1.Pod{p1}, nil).Twice() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() onNodeGroupDeleteMock.On("Delete", "autoprovisioned-"+ @@ -984,7 +980,7 @@ func TestStaticAutoscalerRunOnceWithALongUnregisteredNode(t *testing.T) { // Scale up. 
readyNodeLister.SetNodes(nodes) allNodeLister.SetNodes(nodes) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() onScaleUpMock.On("ScaleUp", "ng1", 1).Return(nil).Once() @@ -1002,7 +998,7 @@ func TestStaticAutoscalerRunOnceWithALongUnregisteredNode(t *testing.T) { // Remove broken node readyNodeLister.SetNodes(nodes) allNodeLister.SetNodes(nodes) - allPodListerMock.On("List").Return([]*apiv1.Pod{}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{}, nil).Once() onScaleDownMock.On("ScaleDown", "ng1", "broken").Return(nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() @@ -1137,7 +1133,7 @@ func TestStaticAutoscalerRunOncePodsWithPriorities(t *testing.T) { // Scale up readyNodeLister.SetNodes([]*apiv1.Node{n1, n2, n3}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2, n3}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2, p3, p4, p5, p6}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2, p3, p4, p5, p6}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() onScaleUpMock.On("ScaleUp", "ng2", 1).Return(nil).Once() @@ -1150,7 +1146,7 @@ func TestStaticAutoscalerRunOncePodsWithPriorities(t *testing.T) { // Mark unneeded nodes. 
readyNodeLister.SetNodes([]*apiv1.Node{n1, n2, n3}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2, n3}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2, p3, p4, p5}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2, p3, p4, p5}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() @@ -1164,7 +1160,7 @@ func TestStaticAutoscalerRunOncePodsWithPriorities(t *testing.T) { // Scale down. readyNodeLister.SetNodes([]*apiv1.Node{n1, n2, n3}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2, n3}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2, p3, p4, p5}, nil).Times(3) + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2, p3, p4, p5}, nil).Twice() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() onScaleDownMock.On("ScaleDown", "ng1", "n1").Return(nil).Once() @@ -1266,7 +1262,7 @@ func TestStaticAutoscalerRunOnceWithFilteringOnBinPackingEstimator(t *testing.T) // Scale up readyNodeLister.SetNodes([]*apiv1.Node{n1, n2}) allNodeLister.SetNodes([]*apiv1.Node{n1, n2}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p3, p4}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p3, p4}, nil).Once() daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() @@ -1365,7 +1361,7 @@ func TestStaticAutoscalerRunOnceWithFilteringOnUpcomingNodesEnabledNoScaleUp(t * // Scale up readyNodeLister.SetNodes([]*apiv1.Node{n2, n3}) allNodeLister.SetNodes([]*apiv1.Node{n2, n3}) - allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2, p3}, nil).Twice() + allPodListerMock.On("List").Return([]*apiv1.Pod{p1, p2, p3}, nil).Once() 
daemonSetListerMock.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() podDisruptionBudgetListerMock.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() @@ -1566,7 +1562,7 @@ func TestStaticAutoscalerRunOnceWithBypassedSchedulers(t *testing.T) { tc.setupConfig.mocks.readyNodeLister.SetNodes([]*apiv1.Node{n1}) tc.setupConfig.mocks.allNodeLister.SetNodes([]*apiv1.Node{n1}) - tc.setupConfig.mocks.allPodLister.On("List").Return(tc.pods, nil).Twice() + tc.setupConfig.mocks.allPodLister.On("List").Return(tc.pods, nil).Once() tc.setupConfig.mocks.daemonSetLister.On("List", labels.Everything()).Return([]*appsv1.DaemonSet{}, nil).Once() tc.setupConfig.mocks.podDisruptionBudgetLister.On("List").Return([]*policyv1.PodDisruptionBudget{}, nil).Once() if tc.expectedScaleUp != nil { diff --git a/cluster-autoscaler/core/test/common.go b/cluster-autoscaler/core/test/common.go index 7dfc57b765ae..5abeffa27e85 100644 --- a/cluster-autoscaler/core/test/common.go +++ b/cluster-autoscaler/core/test/common.go @@ -36,9 +36,8 @@ import ( processor_callbacks "k8s.io/autoscaler/cluster-autoscaler/processors/callbacks" "k8s.io/autoscaler/cluster-autoscaler/processors/nodegroups" "k8s.io/autoscaler/cluster-autoscaler/processors/status" - "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/testsnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" "k8s.io/autoscaler/cluster-autoscaler/utils/backoff" "k8s.io/autoscaler/cluster-autoscaler/utils/errors" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" @@ -175,15 +174,14 @@ func NewScaleTestAutoscalingContext( if err != nil { return context.AutoscalingContext{}, err } - predicateChecker, err := predicatechecker.NewTestPredicateChecker() - if err != nil { - return context.AutoscalingContext{}, err - } remainingPdbTracker := 
pdb.NewBasicRemainingPdbTracker() if debuggingSnapshotter == nil { debuggingSnapshotter = debuggingsnapshot.NewDebuggingSnapshotter(false) } - clusterSnapshot := clustersnapshot.NewBasicClusterSnapshot() + clusterSnapshot, err := testsnapshot.NewTestSnapshot() + if err != nil { + return context.AutoscalingContext{}, err + } return context.AutoscalingContext{ AutoscalingOptions: options, AutoscalingKubeClients: context.AutoscalingKubeClients{ @@ -193,7 +191,6 @@ func NewScaleTestAutoscalingContext( ListerRegistry: listers, }, CloudProvider: provider, - PredicateChecker: predicateChecker, ClusterSnapshot: clusterSnapshot, ExpanderStrategy: random.NewStrategy(), ProcessorCallbacks: processorCallbacks, diff --git a/cluster-autoscaler/core/utils/utils.go b/cluster-autoscaler/core/utils/utils.go index c25db2ef8453..1b493b783cfc 100644 --- a/cluster-autoscaler/core/utils/utils.go +++ b/cluster-autoscaler/core/utils/utils.go @@ -17,52 +17,17 @@ limitations under the License. package utils import ( - "fmt" - "math/rand" "reflect" "time" - appsv1 "k8s.io/api/apps/v1" apiv1 "k8s.io/api/core/v1" "k8s.io/autoscaler/cluster-autoscaler/cloudprovider" "k8s.io/autoscaler/cluster-autoscaler/clusterstate" "k8s.io/autoscaler/cluster-autoscaler/metrics" - "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/utils/daemonset" "k8s.io/autoscaler/cluster-autoscaler/utils/errors" "k8s.io/autoscaler/cluster-autoscaler/utils/gpu" - "k8s.io/autoscaler/cluster-autoscaler/utils/labels" - "k8s.io/autoscaler/cluster-autoscaler/utils/taints" ) -// GetNodeInfoFromTemplate returns NodeInfo object built base on TemplateNodeInfo returned by NodeGroup.TemplateNodeInfo(). 
-func GetNodeInfoFromTemplate(nodeGroup cloudprovider.NodeGroup, daemonsets []*appsv1.DaemonSet, taintConfig taints.TaintConfig) (*framework.NodeInfo, errors.AutoscalerError) { - id := nodeGroup.Id() - baseNodeInfo, err := nodeGroup.TemplateNodeInfo() - if err != nil { - return nil, errors.ToAutoscalerError(errors.CloudProviderError, err) - } - - labels.UpdateDeprecatedLabels(baseNodeInfo.Node().ObjectMeta.Labels) - - sanitizedNode, typedErr := SanitizeNode(baseNodeInfo.Node(), id, taintConfig) - if err != nil { - return nil, typedErr - } - baseNodeInfo.SetNode(sanitizedNode) - - pods, err := daemonset.GetDaemonSetPodsForNode(baseNodeInfo, daemonsets) - if err != nil { - return nil, errors.ToAutoscalerError(errors.InternalError, err) - } - for _, podInfo := range baseNodeInfo.Pods() { - pods = append(pods, &framework.PodInfo{Pod: podInfo.Pod}) - } - - sanitizedNodeInfo := framework.NewNodeInfo(sanitizedNode, nil, SanitizePods(pods, sanitizedNode)...) - return sanitizedNodeInfo, nil -} - // isVirtualNode determines if the node is created by virtual kubelet func isVirtualNode(node *apiv1.Node) bool { return node.ObjectMeta.Labels["type"] == "virtual-kubelet" @@ -89,48 +54,6 @@ func FilterOutNodesFromNotAutoscaledGroups(nodes []*apiv1.Node, cloudProvider cl return result, nil } -// DeepCopyNodeInfo clones the provided nodeInfo -func DeepCopyNodeInfo(nodeInfo *framework.NodeInfo) *framework.NodeInfo { - newPods := make([]*framework.PodInfo, 0) - for _, podInfo := range nodeInfo.Pods() { - newPods = append(newPods, &framework.PodInfo{Pod: podInfo.Pod.DeepCopy()}) - } - - // Build a new node info. - newNodeInfo := framework.NewNodeInfo(nodeInfo.Node().DeepCopy(), nil, newPods...) 
- return newNodeInfo -} - -// SanitizeNode cleans up nodes used for node group templates -func SanitizeNode(node *apiv1.Node, nodeGroup string, taintConfig taints.TaintConfig) (*apiv1.Node, errors.AutoscalerError) { - newNode := node.DeepCopy() - nodeName := fmt.Sprintf("template-node-for-%s-%d", nodeGroup, rand.Int63()) - newNode.Labels = make(map[string]string, len(node.Labels)) - for k, v := range node.Labels { - if k != apiv1.LabelHostname { - newNode.Labels[k] = v - } else { - newNode.Labels[k] = nodeName - } - } - newNode.Name = nodeName - newNode.Spec.Taints = taints.SanitizeTaints(newNode.Spec.Taints, taintConfig) - return newNode, nil -} - -// SanitizePods cleans up pods used for node group templates -func SanitizePods(pods []*framework.PodInfo, sanitizedNode *apiv1.Node) []*framework.PodInfo { - // Update node name in pods. - sanitizedPods := make([]*framework.PodInfo, 0) - for _, pod := range pods { - sanitizedPod := pod.Pod.DeepCopy() - sanitizedPod.Spec.NodeName = sanitizedNode.Name - sanitizedPods = append(sanitizedPods, &framework.PodInfo{Pod: sanitizedPod}) - } - - return sanitizedPods -} - func hasHardInterPodAffinity(affinity *apiv1.Affinity) bool { if affinity == nil { return false diff --git a/cluster-autoscaler/core/utils/utils_test.go b/cluster-autoscaler/core/utils/utils_test.go index b63badbcc834..2613b0419a13 100644 --- a/cluster-autoscaler/core/utils/utils_test.go +++ b/cluster-autoscaler/core/utils/utils_test.go @@ -20,8 +20,6 @@ import ( "testing" "time" - "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/utils/taints" . 
"k8s.io/autoscaler/cluster-autoscaler/utils/test" "github.com/stretchr/testify/assert" @@ -29,33 +27,6 @@ import ( metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" ) -func TestSanitizePods(t *testing.T) { - pod := BuildTestPod("p1", 80, 0) - pod.Spec.NodeName = "n1" - pods := []*framework.PodInfo{{Pod: pod}} - - node := BuildTestNode("node", 1000, 1000) - - resNode, err := SanitizeNode(node, "test-group", taints.TaintConfig{}) - assert.NoError(t, err) - res := SanitizePods(pods, resNode) - assert.Equal(t, 1, len(res)) -} - -func TestSanitizeLabels(t *testing.T) { - oldNode := BuildTestNode("ng1-1", 1000, 1000) - oldNode.Labels = map[string]string{ - apiv1.LabelHostname: "abc", - "x": "y", - } - node, err := SanitizeNode(oldNode, "bzium", taints.TaintConfig{}) - assert.NoError(t, err) - assert.NotEqual(t, node.Labels[apiv1.LabelHostname], "abc", nil) - assert.Equal(t, node.Labels["x"], "y") - assert.NotEqual(t, node.Name, oldNode.Name) - assert.Equal(t, node.Labels[apiv1.LabelHostname], node.Name) -} - func TestGetNodeResource(t *testing.T) { node := BuildTestNode("n1", 1000, 2*MiB) diff --git a/cluster-autoscaler/estimator/binpacking_estimator.go b/cluster-autoscaler/estimator/binpacking_estimator.go index 55e1de431997..313155d9c2d1 100644 --- a/cluster-autoscaler/estimator/binpacking_estimator.go +++ b/cluster-autoscaler/estimator/binpacking_estimator.go @@ -21,16 +21,14 @@ import ( apiv1 "k8s.io/api/core/v1" "k8s.io/autoscaler/cluster-autoscaler/cloudprovider" + core_utils "k8s.io/autoscaler/cluster-autoscaler/simulator" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" - "k8s.io/autoscaler/cluster-autoscaler/utils/scheduler" "k8s.io/klog/v2" ) // BinpackingNodeEstimator estimates the number of needed nodes to handle the given amount of pods. 
type BinpackingNodeEstimator struct { - predicateChecker predicatechecker.PredicateChecker clusterSnapshot clustersnapshot.ClusterSnapshot limiter EstimationLimiter podOrderer EstimationPodOrderer @@ -48,9 +46,13 @@ type estimationState struct { newNodesWithPods map[string]bool } +func (s *estimationState) trackScheduledPod(pod *apiv1.Pod, nodeName string) { + s.newNodesWithPods[nodeName] = true + s.scheduledPods = append(s.scheduledPods, pod) +} + // NewBinpackingNodeEstimator builds a new BinpackingNodeEstimator. func NewBinpackingNodeEstimator( - predicateChecker predicatechecker.PredicateChecker, clusterSnapshot clustersnapshot.ClusterSnapshot, limiter EstimationLimiter, podOrderer EstimationPodOrderer, @@ -58,7 +60,6 @@ func NewBinpackingNodeEstimator( estimationAnalyserFunc EstimationAnalyserFunc, ) *BinpackingNodeEstimator { return &BinpackingNodeEstimator{ - predicateChecker: predicateChecker, clusterSnapshot: clusterSnapshot, limiter: limiter, podOrderer: podOrderer, @@ -136,16 +137,16 @@ func (e *BinpackingNodeEstimator) tryToScheduleOnExistingNodes( pod := pods[index] // Check schedulability on all nodes created during simulation - nodeName, err := e.predicateChecker.FitsAnyNodeMatching(e.clusterSnapshot, pod, func(nodeInfo *framework.NodeInfo) bool { + nodeName, err := e.clusterSnapshot.SchedulePodOnAnyNodeMatching(pod, func(nodeInfo *framework.NodeInfo) bool { return estimationState.newNodeNames[nodeInfo.Node().Name] }) - if err != nil { + if err != nil && err.Type() == clustersnapshot.NoNodesPassingPredicatesFoundError { break - } - - if err := e.tryToAddNode(estimationState, pod, nodeName); err != nil { + } else if err != nil { + // Unexpected error. 
return nil, err } + estimationState.trackScheduledPod(pod, nodeName) } return pods[index:], nil } @@ -160,11 +161,12 @@ func (e *BinpackingNodeEstimator) tryToScheduleOnNewNodes( if estimationState.lastNodeName != "" { // Check schedulability on only newly created node - if err := e.predicateChecker.CheckPredicates(e.clusterSnapshot, pod, estimationState.lastNodeName); err == nil { + if err := e.clusterSnapshot.SchedulePod(pod, estimationState.lastNodeName); err == nil { found = true - if err := e.tryToAddNode(estimationState, pod, estimationState.lastNodeName); err != nil { - return err - } + estimationState.trackScheduledPod(pod, estimationState.lastNodeName) + } else if err.Type() != clustersnapshot.FailingPredicateError { + // Unexpected error. + return err } } @@ -195,12 +197,13 @@ func (e *BinpackingNodeEstimator) tryToScheduleOnNewNodes( // Note that this may still fail (ex. if topology spreading with zonal topologyKey is used); // in this case we can't help the pending pod. We keep the node in clusterSnapshot to avoid // adding and removing node to snapshot for each such pod. - if err := e.predicateChecker.CheckPredicates(e.clusterSnapshot, pod, estimationState.lastNodeName); err != nil { + if err := e.clusterSnapshot.SchedulePod(pod, estimationState.lastNodeName); err != nil && err.Type() == clustersnapshot.FailingPredicateError { break - } - if err := e.tryToAddNode(estimationState, pod, estimationState.lastNodeName); err != nil { + } else if err != nil { + // Unexpected error. 
return err } + estimationState.trackScheduledPod(pod, estimationState.lastNodeName) } } return nil @@ -210,7 +213,7 @@ func (e *BinpackingNodeEstimator) addNewNodeToSnapshot( estimationState *estimationState, template *framework.NodeInfo, ) error { - newNodeInfo := scheduler.DeepCopyTemplateNode(template, fmt.Sprintf("e-%d", estimationState.newNodeNameIndex)) + newNodeInfo := core_utils.FreshNodeInfoFromTemplateNodeInfo(template, fmt.Sprintf("e-%d", estimationState.newNodeNameIndex)) if err := e.clusterSnapshot.AddNodeInfo(newNodeInfo); err != nil { return err } @@ -219,16 +222,3 @@ func (e *BinpackingNodeEstimator) addNewNodeToSnapshot( estimationState.newNodeNames[estimationState.lastNodeName] = true return nil } - -func (e *BinpackingNodeEstimator) tryToAddNode( - estimationState *estimationState, - pod *apiv1.Pod, - nodeName string, -) error { - if err := e.clusterSnapshot.ForceAddPod(pod, nodeName); err != nil { - return fmt.Errorf("Error adding pod %v.%v to node %v in ClusterSnapshot; %v", pod.Namespace, pod.Name, nodeName, err) - } - estimationState.newNodesWithPods[nodeName] = true - estimationState.scheduledPods = append(estimationState.scheduledPods, pod) - return nil -} diff --git a/cluster-autoscaler/estimator/binpacking_estimator_test.go b/cluster-autoscaler/estimator/binpacking_estimator_test.go index e0205ffdc854..ac205f16ba46 100644 --- a/cluster-autoscaler/estimator/binpacking_estimator_test.go +++ b/cluster-autoscaler/estimator/binpacking_estimator_test.go @@ -20,17 +20,15 @@ import ( "testing" "time" + "github.com/stretchr/testify/assert" + apiv1 "k8s.io/api/core/v1" "k8s.io/apimachinery/pkg/api/resource" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" - "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/testsnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" . 
"k8s.io/autoscaler/cluster-autoscaler/utils/test" "k8s.io/autoscaler/cluster-autoscaler/utils/units" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" - - "github.com/stretchr/testify/assert" ) func makePodEquivalenceGroup(pod *apiv1.Pod, podCount int) PodEquivalenceGroup { @@ -66,8 +64,6 @@ func makeNode(cpu, mem, podCount int64, name string, zone string) *apiv1.Node { } func TestBinpackingEstimate(t *testing.T) { - schedulermetrics.Register() - highResourcePodGroup := makePodEquivalenceGroup( BuildTestPod( "estimatee", @@ -212,16 +208,14 @@ func TestBinpackingEstimate(t *testing.T) { } for _, tc := range testCases { t.Run(tc.name, func(t *testing.T) { - clusterSnapshot := clustersnapshot.NewBasicClusterSnapshot() + clusterSnapshot := testsnapshot.NewTestSnapshotOrDie(t) // Add one node in different zone to trigger topology spread constraints err := clusterSnapshot.AddNodeInfo(framework.NewTestNodeInfo(makeNode(100, 100, 10, "oldnode", "zone-jupiter"))) assert.NoError(t, err) - predicateChecker, err := predicatechecker.NewTestPredicateChecker() - assert.NoError(t, err) limiter := NewThresholdBasedEstimationLimiter([]Threshold{NewStaticThreshold(tc.maxNodes, time.Duration(0))}) processor := NewDecreasingPodOrderer() - estimator := NewBinpackingNodeEstimator(predicateChecker, clusterSnapshot, limiter, processor, nil /* EstimationContext */, nil /* EstimationAnalyserFunc */) + estimator := NewBinpackingNodeEstimator(clusterSnapshot, limiter, processor, nil /* EstimationContext */, nil /* EstimationAnalyserFunc */) node := makeNode(tc.millicores, tc.memory, 10, "template", "zone-mars") nodeInfo := framework.NewTestNodeInfo(node) @@ -268,15 +262,13 @@ func BenchmarkBinpackingEstimate(b *testing.B) { } for i := 0; i < b.N; i++ { - clusterSnapshot := clustersnapshot.NewBasicClusterSnapshot() + clusterSnapshot := testsnapshot.NewTestSnapshotOrDie(b) err := clusterSnapshot.AddNodeInfo(framework.NewTestNodeInfo(makeNode(100, 100, 10, "oldnode", "zone-jupiter"))) 
assert.NoError(b, err) - predicateChecker, err := predicatechecker.NewTestPredicateChecker() - assert.NoError(b, err) limiter := NewThresholdBasedEstimationLimiter([]Threshold{NewStaticThreshold(maxNodes, time.Duration(0))}) processor := NewDecreasingPodOrderer() - estimator := NewBinpackingNodeEstimator(predicateChecker, clusterSnapshot, limiter, processor, nil /* EstimationContext */, nil /* EstimationAnalyserFunc */) + estimator := NewBinpackingNodeEstimator(clusterSnapshot, limiter, processor, nil /* EstimationContext */, nil /* EstimationAnalyserFunc */) node := makeNode(millicores, memory, podsPerNode, "template", "zone-mars") nodeInfo := framework.NewTestNodeInfo(node) diff --git a/cluster-autoscaler/estimator/estimator.go b/cluster-autoscaler/estimator/estimator.go index b8e3db070349..19752115a3e6 100644 --- a/cluster-autoscaler/estimator/estimator.go +++ b/cluster-autoscaler/estimator/estimator.go @@ -23,7 +23,6 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/cloudprovider" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" ) const ( @@ -57,7 +56,7 @@ type Estimator interface { } // EstimatorBuilder creates a new estimator object. -type EstimatorBuilder func(predicatechecker.PredicateChecker, clustersnapshot.ClusterSnapshot, EstimationContext) Estimator +type EstimatorBuilder func(clustersnapshot.ClusterSnapshot, EstimationContext) Estimator // EstimationAnalyserFunc to be run at the end of the estimation logic. 
type EstimationAnalyserFunc func(clustersnapshot.ClusterSnapshot, cloudprovider.NodeGroup, map[string]bool) @@ -67,10 +66,9 @@ func NewEstimatorBuilder(name string, limiter EstimationLimiter, orderer Estimat switch name { case BinpackingEstimatorName: return func( - predicateChecker predicatechecker.PredicateChecker, clusterSnapshot clustersnapshot.ClusterSnapshot, context EstimationContext) Estimator { - return NewBinpackingNodeEstimator(predicateChecker, clusterSnapshot, limiter, orderer, context, estimationAnalyserFunc) + return NewBinpackingNodeEstimator(clusterSnapshot, limiter, orderer, context, estimationAnalyserFunc) }, nil } return nil, fmt.Errorf("unknown estimator: %s", name) diff --git a/cluster-autoscaler/go.mod b/cluster-autoscaler/go.mod index eae107a99bee..bfcc12bf5f19 100644 --- a/cluster-autoscaler/go.mod +++ b/cluster-autoscaler/go.mod @@ -233,64 +233,5 @@ replace github.com/digitalocean/godo => github.com/digitalocean/godo v1.27.0 replace github.com/rancher/go-rancher => github.com/rancher/go-rancher v0.1.0 -replace k8s.io/api => k8s.io/api v0.32.0-alpha.3 - -replace k8s.io/apiextensions-apiserver => k8s.io/apiextensions-apiserver v0.32.0-alpha.3 - -replace k8s.io/apimachinery => k8s.io/apimachinery v0.32.0-alpha.3 - -replace k8s.io/apiserver => k8s.io/apiserver v0.32.0-alpha.3 - -replace k8s.io/cli-runtime => k8s.io/cli-runtime v0.32.0-alpha.3 - -replace k8s.io/client-go => k8s.io/client-go v0.32.0-alpha.3 - -replace k8s.io/cloud-provider => k8s.io/cloud-provider v0.32.0-alpha.3 - -replace k8s.io/cluster-bootstrap => k8s.io/cluster-bootstrap v0.32.0-alpha.3 - -replace k8s.io/code-generator => k8s.io/code-generator v0.32.0-alpha.3 - -replace k8s.io/component-base => k8s.io/component-base v0.32.0-alpha.3 - -replace k8s.io/component-helpers => k8s.io/component-helpers v0.32.0-alpha.3 - -replace k8s.io/controller-manager => k8s.io/controller-manager v0.32.0-alpha.3 - -replace k8s.io/cri-api => k8s.io/cri-api v0.32.0-alpha.3 - -replace 
k8s.io/csi-translation-lib => k8s.io/csi-translation-lib v0.32.0-alpha.3 - -replace k8s.io/kube-aggregator => k8s.io/kube-aggregator v0.32.0-alpha.3 - -replace k8s.io/kube-controller-manager => k8s.io/kube-controller-manager v0.32.0-alpha.3 - -replace k8s.io/kube-proxy => k8s.io/kube-proxy v0.32.0-alpha.3 - -replace k8s.io/kube-scheduler => k8s.io/kube-scheduler v0.32.0-alpha.3 - -replace k8s.io/kubectl => k8s.io/kubectl v0.32.0-alpha.3 - -replace k8s.io/kubelet => k8s.io/kubelet v0.32.0-alpha.3 - -replace k8s.io/metrics => k8s.io/metrics v0.32.0-alpha.3 - -replace k8s.io/mount-utils => k8s.io/mount-utils v0.32.0-alpha.3 - -replace k8s.io/sample-apiserver => k8s.io/sample-apiserver v0.32.0-alpha.3 - -replace k8s.io/sample-cli-plugin => k8s.io/sample-cli-plugin v0.32.0-alpha.3 - -replace k8s.io/sample-controller => k8s.io/sample-controller v0.32.0-alpha.3 - -replace k8s.io/pod-security-admission => k8s.io/pod-security-admission v0.32.0-alpha.3 - -replace k8s.io/dynamic-resource-allocation => k8s.io/dynamic-resource-allocation v0.32.0-alpha.3 - -replace k8s.io/kms => k8s.io/kms v0.32.0-alpha.3 - -replace k8s.io/endpointslice => k8s.io/endpointslice v0.32.0-alpha.3 - replace k8s.io/autoscaler/cluster-autoscaler/apis => ./apis -replace k8s.io/cri-client => k8s.io/cri-client v0.32.0-alpha.3 diff --git a/cluster-autoscaler/main.go b/cluster-autoscaler/main.go index cf3ca31ccbe5..21d711743896 100644 --- a/cluster-autoscaler/main.go +++ b/cluster-autoscaler/main.go @@ -28,6 +28,8 @@ import ( "syscall" "time" + "github.com/spf13/pflag" + "k8s.io/autoscaler/cluster-autoscaler/core/scaledown/actuation" "k8s.io/autoscaler/cluster-autoscaler/core/scaleup/orchestrator" "k8s.io/autoscaler/cluster-autoscaler/debuggingsnapshot" @@ -35,12 +37,12 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/provisioningrequest/besteffortatomic" "k8s.io/autoscaler/cluster-autoscaler/provisioningrequest/checkcapacity" "k8s.io/autoscaler/cluster-autoscaler/provisioningrequest/provreqclient" - 
"k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/base" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/predicate" + "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/simulator/scheduling" kubelet_config "k8s.io/kubernetes/pkg/kubelet/apis/config" - "github.com/spf13/pflag" - "k8s.io/apimachinery/pkg/api/meta" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" "k8s.io/apiserver/pkg/server/mux" @@ -68,7 +70,6 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/processors/scaledowncandidates/previouscandidates" "k8s.io/autoscaler/cluster-autoscaler/processors/status" provreqorchestrator "k8s.io/autoscaler/cluster-autoscaler/provisioningrequest/orchestrator" - "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/drainability/rules" "k8s.io/autoscaler/cluster-autoscaler/simulator/options" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" @@ -88,7 +89,6 @@ import ( "k8s.io/component-base/metrics/legacyregistry" "k8s.io/klog/v2" scheduler_config "k8s.io/kubernetes/pkg/scheduler/apis/config" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" ) // MultiStringFlag is a flag for passing multiple parameters using same flag @@ -280,6 +280,7 @@ var ( checkCapacityProvisioningRequestMaxBatchSize = flag.Int("check-capacity-provisioning-request-max-batch-size", 10, "Maximum number of provisioning requests to process in a single batch.") checkCapacityProvisioningRequestBatchTimebox = flag.Duration("check-capacity-provisioning-request-batch-timebox", 10*time.Second, "Maximum time to process a batch of provisioning requests.") forceDeleteLongUnregisteredNodes = flag.Bool("force-delete-unregistered-nodes", false, "Whether to enable force deletion of long unregistered nodes, regardless of the min size of the node group the belong to.") + 
enableDynamicResourceAllocation = flag.Bool("enable-dynamic-resource-allocation", false, "Whether logic for handling DRA (Dynamic Resource Allocation) objects is enabled.") ) func isFlagPassed(name string) bool { @@ -459,6 +460,7 @@ func createAutoscalingOptions() config.AutoscalingOptions { CheckCapacityProvisioningRequestMaxBatchSize: *checkCapacityProvisioningRequestMaxBatchSize, CheckCapacityProvisioningRequestBatchTimebox: *checkCapacityProvisioningRequestBatchTimebox, ForceDeleteLongUnregisteredNodes: *forceDeleteLongUnregisteredNodes, + DynamicResourceAllocationEnabled: *enableDynamicResourceAllocation, } } @@ -494,7 +496,7 @@ func buildAutoscaler(context ctx.Context, debuggingSnapshotter debuggingsnapshot } informerFactory := informers.NewSharedInformerFactoryWithOptions(kubeClient, 0, informers.WithTransform(trim)) - predicateChecker, err := predicatechecker.NewSchedulerBasedPredicateChecker(informerFactory, autoscalingOptions.SchedulerConfig) + fwHandle, err := framework.NewHandle(informerFactory, autoscalingOptions.SchedulerConfig, autoscalingOptions.DynamicResourceAllocationEnabled) if err != nil { return nil, nil, err } @@ -503,11 +505,11 @@ func buildAutoscaler(context ctx.Context, debuggingSnapshotter debuggingsnapshot opts := core.AutoscalerOptions{ AutoscalingOptions: autoscalingOptions, - ClusterSnapshot: clustersnapshot.NewDeltaClusterSnapshot(), + FrameworkHandle: fwHandle, + ClusterSnapshot: predicate.NewPredicateSnapshot(base.NewDeltaSnapshotBase(), fwHandle, autoscalingOptions.DynamicResourceAllocationEnabled), KubeClient: kubeClient, InformerFactory: informerFactory, DebuggingSnapshotter: debuggingSnapshotter, - PredicateChecker: predicateChecker, DeleteOptions: deleteOptions, DrainabilityRules: drainabilityRules, ScaleUpOrchestrator: orchestrator.New(), @@ -515,7 +517,7 @@ func buildAutoscaler(context ctx.Context, debuggingSnapshotter debuggingsnapshot opts.Processors = ca_processors.DefaultProcessors(autoscalingOptions) 
opts.Processors.TemplateNodeInfoProvider = nodeinfosprovider.NewDefaultTemplateNodeInfoProvider(nodeInfoCacheExpireTime, *forceDaemonSets) - podListProcessor := podlistprocessor.NewDefaultPodListProcessor(opts.PredicateChecker, scheduling.ScheduleAnywhere) + podListProcessor := podlistprocessor.NewDefaultPodListProcessor(scheduling.ScheduleAnywhere) var ProvisioningRequestInjector *provreq.ProvisioningRequestPodsInjector if autoscalingOptions.ProvisioningRequestEnabled { @@ -546,7 +548,7 @@ func buildAutoscaler(context ctx.Context, debuggingSnapshotter debuggingsnapshot scaleUpOrchestrator := provreqorchestrator.NewWrapperOrchestrator(provreqOrchestrator) opts.ScaleUpOrchestrator = scaleUpOrchestrator - provreqProcesor := provreq.NewProvReqProcessor(client, opts.PredicateChecker) + provreqProcesor := provreq.NewProvReqProcessor(client) opts.LoopStartNotifier = loopstart.NewObserversList([]loopstart.Observer{provreqProcesor}) podListProcessor.AddProcessor(provreqProcesor) @@ -632,7 +634,6 @@ func buildAutoscaler(context ctx.Context, debuggingSnapshotter debuggingsnapshot } func run(healthCheck *metrics.HealthCheck, debuggingSnapshotter debuggingsnapshot.DebuggingSnapshotter) { - schedulermetrics.Register() metrics.RegisterAll(*emitPerNodeGroupMetrics) context, cancel := ctx.WithCancel(ctx.Background()) defer cancel() diff --git a/cluster-autoscaler/processors/nodeinfosprovider/mixed_nodeinfos_processor.go b/cluster-autoscaler/processors/nodeinfosprovider/mixed_nodeinfos_processor.go index 8b0ebd58571a..34f486392099 100644 --- a/cluster-autoscaler/processors/nodeinfosprovider/mixed_nodeinfos_processor.go +++ b/cluster-autoscaler/processors/nodeinfosprovider/mixed_nodeinfos_processor.go @@ -24,7 +24,6 @@ import ( apiv1 "k8s.io/api/core/v1" "k8s.io/autoscaler/cluster-autoscaler/cloudprovider" "k8s.io/autoscaler/cluster-autoscaler/context" - "k8s.io/autoscaler/cluster-autoscaler/core/utils" "k8s.io/autoscaler/cluster-autoscaler/simulator" 
"k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/utils/errors" @@ -78,11 +77,6 @@ func (p *MixedTemplateNodeInfoProvider) Process(ctx *context.AutoscalingContext, result := make(map[string]*framework.NodeInfo) seenGroups := make(map[string]bool) - podsForNodes, err := getPodsForNodes(ctx.ListerRegistry) - if err != nil { - return map[string]*framework.NodeInfo{}, err - } - // processNode returns information whether the nodeTemplate was generated and if there was an error. processNode := func(node *apiv1.Node) (bool, string, errors.AutoscalerError) { nodeGroup, err := ctx.CloudProvider.NodeGroupForNode(node) @@ -94,22 +88,15 @@ func (p *MixedTemplateNodeInfoProvider) Process(ctx *context.AutoscalingContext, } id := nodeGroup.Id() if _, found := result[id]; !found { - // Build nodeInfo. - sanitizedNode, err := utils.SanitizeNode(node, id, taintConfig) + nodeInfo, err := ctx.ClusterSnapshot.GetNodeInfo(node.Name) if err != nil { - return false, "", err + return false, "", errors.NewAutoscalerError(errors.InternalError, "error while retrieving node %s from cluster snapshot - this shouldn't happen: %v", node.Name, err) } - nodeInfo, err := simulator.BuildNodeInfoForNode(sanitizedNode, podsForNodes[node.Name], daemonsets, p.forceDaemonSets) + templateNodeInfo, caErr := simulator.TemplateNodeInfoFromExampleNodeInfo(nodeInfo, id, daemonsets, p.forceDaemonSets, taintConfig) if err != nil { - return false, "", err - } - - var pods []*apiv1.Pod - for _, podInfo := range nodeInfo.Pods() { - pods = append(pods, podInfo.Pod) + return false, "", caErr } - sanitizedNodeInfo := framework.NewNodeInfo(sanitizedNode, nil, utils.SanitizePods(nodeInfo.Pods(), sanitizedNode)...) 
- result[id] = sanitizedNodeInfo + result[id] = templateNodeInfo return true, id, nil } return false, "", nil @@ -125,7 +112,7 @@ func (p *MixedTemplateNodeInfoProvider) Process(ctx *context.AutoscalingContext, return map[string]*framework.NodeInfo{}, typedErr } if added && p.nodeInfoCache != nil { - nodeInfoCopy := utils.DeepCopyNodeInfo(result[id]) + nodeInfoCopy := result[id].DeepCopy() p.nodeInfoCache[id] = cacheItem{NodeInfo: nodeInfoCopy, added: time.Now()} } } @@ -142,7 +129,7 @@ func (p *MixedTemplateNodeInfoProvider) Process(ctx *context.AutoscalingContext, if p.isCacheItemExpired(cacheItem.added) { delete(p.nodeInfoCache, id) } else { - result[id] = utils.DeepCopyNodeInfo(cacheItem.NodeInfo) + result[id] = cacheItem.NodeInfo.DeepCopy() continue } } @@ -150,7 +137,7 @@ func (p *MixedTemplateNodeInfoProvider) Process(ctx *context.AutoscalingContext, // No good template, trying to generate one. This is called only if there are no // working nodes in the node groups. By default CA tries to use a real-world example. 
- nodeInfo, err := utils.GetNodeInfoFromTemplate(nodeGroup, daemonsets, taintConfig) + nodeInfo, err := simulator.TemplateNodeInfoFromNodeGroupTemplate(nodeGroup, daemonsets, taintConfig) if err != nil { if err == cloudprovider.ErrNotImplemented { continue @@ -192,19 +179,6 @@ func (p *MixedTemplateNodeInfoProvider) Process(ctx *context.AutoscalingContext, return result, nil } -func getPodsForNodes(listers kube_util.ListerRegistry) (map[string][]*apiv1.Pod, errors.AutoscalerError) { - pods, err := listers.AllPodLister().List() - if err != nil { - return nil, errors.ToAutoscalerError(errors.ApiCallError, err) - } - scheduledPods := kube_util.ScheduledPods(pods) - podsForNodes := map[string][]*apiv1.Pod{} - for _, p := range scheduledPods { - podsForNodes[p.Spec.NodeName] = append(podsForNodes[p.Spec.NodeName], p) - } - return podsForNodes, nil -} - func isNodeGoodTemplateCandidate(node *apiv1.Node, now time.Time) bool { ready, lastTransitionTime, _ := kube_util.GetReadinessState(node) stable := lastTransitionTime.Add(stabilizationDelay).Before(now) diff --git a/cluster-autoscaler/processors/nodeinfosprovider/mixed_nodeinfos_processor_test.go b/cluster-autoscaler/processors/nodeinfosprovider/mixed_nodeinfos_processor_test.go index 68e04752a8dc..fa631f18466b 100644 --- a/cluster-autoscaler/processors/nodeinfosprovider/mixed_nodeinfos_processor_test.go +++ b/cluster-autoscaler/processors/nodeinfosprovider/mixed_nodeinfos_processor_test.go @@ -20,18 +20,18 @@ import ( "testing" "time" + "github.com/stretchr/testify/assert" + + appsv1 "k8s.io/api/apps/v1" + apiv1 "k8s.io/api/core/v1" testprovider "k8s.io/autoscaler/cluster-autoscaler/cloudprovider/test" "k8s.io/autoscaler/cluster-autoscaler/context" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/testsnapshot" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - 
"k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" "k8s.io/autoscaler/cluster-autoscaler/utils/taints" . "k8s.io/autoscaler/cluster-autoscaler/utils/test" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" - - "github.com/stretchr/testify/assert" - appsv1 "k8s.io/api/apps/v1" - apiv1 "k8s.io/api/core/v1" ) var ( @@ -39,8 +39,6 @@ var ( ) func TestGetNodeInfosForGroups(t *testing.T) { - schedulermetrics.Register() - now := time.Now() ready1 := BuildTestNode("n1", 1000, 1000) SetNodeReadyState(ready1, true, now.Add(-2*time.Minute)) @@ -78,17 +76,19 @@ func TestGetNodeInfosForGroups(t *testing.T) { podLister := kube_util.NewTestPodLister([]*apiv1.Pod{}) registry := kube_util.NewListerRegistry(nil, nil, podLister, nil, nil, nil, nil, nil, nil) - predicateChecker, err := predicatechecker.NewTestPredicateChecker() + nodes := []*apiv1.Node{justReady5, unready4, unready3, ready2, ready1} + snapshot := testsnapshot.NewTestSnapshotOrDie(t) + err := snapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) assert.NoError(t, err) ctx := context.AutoscalingContext{ - CloudProvider: provider1, - PredicateChecker: predicateChecker, + CloudProvider: provider1, + ClusterSnapshot: snapshot, AutoscalingKubeClients: context.AutoscalingKubeClients{ ListerRegistry: registry, }, } - res, err := NewMixedTemplateNodeInfoProvider(&cacheTtl, false).Process(&ctx, []*apiv1.Node{justReady5, unready4, unready3, ready2, ready1}, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) + res, err := NewMixedTemplateNodeInfoProvider(&cacheTtl, false).Process(&ctx, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) assert.NoError(t, err) assert.Equal(t, 5, len(res)) info, found := res["ng1"] @@ -109,8 +109,8 @@ func TestGetNodeInfosForGroups(t *testing.T) { // Test for a nodegroup without nodes and TemplateNodeInfo not implemented by cloud proivder ctx = context.AutoscalingContext{ - CloudProvider: 
provider2, - PredicateChecker: predicateChecker, + CloudProvider: provider2, + ClusterSnapshot: testsnapshot.NewTestSnapshotOrDie(t), AutoscalingKubeClients: context.AutoscalingKubeClients{ ListerRegistry: registry, }, @@ -162,19 +162,21 @@ func TestGetNodeInfosForGroupsCache(t *testing.T) { podLister := kube_util.NewTestPodLister([]*apiv1.Pod{}) registry := kube_util.NewListerRegistry(nil, nil, podLister, nil, nil, nil, nil, nil, nil) - predicateChecker, err := predicatechecker.NewTestPredicateChecker() + nodes := []*apiv1.Node{unready4, unready3, ready2, ready1} + snapshot := testsnapshot.NewTestSnapshotOrDie(t) + err := snapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) assert.NoError(t, err) // Fill cache ctx := context.AutoscalingContext{ - CloudProvider: provider1, - PredicateChecker: predicateChecker, + CloudProvider: provider1, + ClusterSnapshot: snapshot, AutoscalingKubeClients: context.AutoscalingKubeClients{ ListerRegistry: registry, }, } niProcessor := NewMixedTemplateNodeInfoProvider(&cacheTtl, false) - res, err := niProcessor.Process(&ctx, []*apiv1.Node{unready4, unready3, ready2, ready1}, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) + res, err := niProcessor.Process(&ctx, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) assert.NoError(t, err) // Check results assert.Equal(t, 4, len(res)) @@ -208,7 +210,7 @@ func TestGetNodeInfosForGroupsCache(t *testing.T) { assert.Equal(t, "ng3", lastDeletedGroup) // Check cache with all nodes removed - res, err = niProcessor.Process(&ctx, []*apiv1.Node{unready4, unready3, ready2, ready1}, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) + res, err = niProcessor.Process(&ctx, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) assert.NoError(t, err) // Check results assert.Equal(t, 2, len(res)) @@ -229,7 +231,7 @@ func TestGetNodeInfosForGroupsCache(t *testing.T) { // Fill cache manually infoNg4Node6 := framework.NewTestNodeInfo(ready6.DeepCopy()) niProcessor.nodeInfoCache = 
map[string]cacheItem{"ng4": {NodeInfo: infoNg4Node6, added: now}} - res, err = niProcessor.Process(&ctx, []*apiv1.Node{unready4, unready3, ready2, ready1}, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) + res, err = niProcessor.Process(&ctx, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) // Check if cache was used assert.NoError(t, err) assert.Equal(t, 2, len(res)) @@ -250,12 +252,15 @@ func TestGetNodeInfosCacheExpired(t *testing.T) { provider := testprovider.NewTestAutoprovisioningCloudProvider(nil, nil, nil, nil, nil, nil) podLister := kube_util.NewTestPodLister([]*apiv1.Pod{}) registry := kube_util.NewListerRegistry(nil, nil, podLister, nil, nil, nil, nil, nil, nil) - predicateChecker, err := predicatechecker.NewTestPredicateChecker() + + nodes := []*apiv1.Node{ready1} + snapshot := testsnapshot.NewTestSnapshotOrDie(t) + err := snapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) assert.NoError(t, err) ctx := context.AutoscalingContext{ - CloudProvider: provider, - PredicateChecker: predicateChecker, + CloudProvider: provider, + ClusterSnapshot: snapshot, AutoscalingKubeClients: context.AutoscalingKubeClients{ ListerRegistry: registry, }, @@ -272,7 +277,7 @@ func TestGetNodeInfosCacheExpired(t *testing.T) { provider.AddNode("ng1", ready1) assert.Equal(t, 2, len(niProcessor1.nodeInfoCache)) - _, err = niProcessor1.Process(&ctx, []*apiv1.Node{ready1}, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) + _, err = niProcessor1.Process(&ctx, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) assert.NoError(t, err) assert.Equal(t, 1, len(niProcessor1.nodeInfoCache)) @@ -283,7 +288,7 @@ func TestGetNodeInfosCacheExpired(t *testing.T) { "ng2": {NodeInfo: tni, added: now.Add(-2 * time.Second)}, } assert.Equal(t, 2, len(niProcessor2.nodeInfoCache)) - _, err = niProcessor1.Process(&ctx, []*apiv1.Node{ready1}, []*appsv1.DaemonSet{}, taints.TaintConfig{}, now) + _, err = niProcessor1.Process(&ctx, nodes, []*appsv1.DaemonSet{}, taints.TaintConfig{}, 
now) assert.NoError(t, err) assert.Equal(t, 2, len(niProcessor2.nodeInfoCache)) diff --git a/cluster-autoscaler/processors/nodes/scale_down_set_processor_test.go b/cluster-autoscaler/processors/nodes/scale_down_set_processor_test.go index dc43792c7183..af18b0ef072e 100644 --- a/cluster-autoscaler/processors/nodes/scale_down_set_processor_test.go +++ b/cluster-autoscaler/processors/nodes/scale_down_set_processor_test.go @@ -20,17 +20,16 @@ import ( "testing" "github.com/stretchr/testify/assert" + testprovider "k8s.io/autoscaler/cluster-autoscaler/cloudprovider/test" "k8s.io/autoscaler/cluster-autoscaler/config" . "k8s.io/autoscaler/cluster-autoscaler/core/test" "k8s.io/autoscaler/cluster-autoscaler/simulator" . "k8s.io/autoscaler/cluster-autoscaler/utils/test" "k8s.io/client-go/kubernetes/fake" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" ) func TestAtomicResizeFilterUnremovableNodes(t *testing.T) { - schedulermetrics.Register() testCases := []struct { name string nodeGroups []struct { diff --git a/cluster-autoscaler/processors/podinjection/pod_injection_processor_test.go b/cluster-autoscaler/processors/podinjection/pod_injection_processor_test.go index 13a98c8d78c8..426da16c68d1 100644 --- a/cluster-autoscaler/processors/podinjection/pod_injection_processor_test.go +++ b/cluster-autoscaler/processors/podinjection/pod_injection_processor_test.go @@ -28,7 +28,8 @@ import ( "k8s.io/apimachinery/pkg/types" "k8s.io/autoscaler/cluster-autoscaler/context" podinjectionbackoff "k8s.io/autoscaler/cluster-autoscaler/processors/podinjection/backoff" - "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/base" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/testsnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" . 
"k8s.io/autoscaler/cluster-autoscaler/utils/test" @@ -112,7 +113,7 @@ func TestTargetCountInjectionPodListProcessor(t *testing.T) { for _, tc := range testCases { t.Run(tc.name, func(t *testing.T) { p := NewPodInjectionPodListProcessor(podinjectionbackoff.NewFakePodControllerRegistry()) - clusterSnapshot := clustersnapshot.NewDeltaClusterSnapshot() + clusterSnapshot := testsnapshot.NewCustomTestSnapshotOrDie(t, base.NewDeltaSnapshotBase()) err := clusterSnapshot.AddNodeInfo(framework.NewTestNodeInfo(node, tc.scheduledPods...)) assert.NoError(t, err) ctx := context.AutoscalingContext{ diff --git a/cluster-autoscaler/processors/provreq/processor.go b/cluster-autoscaler/processors/provreq/processor.go index 56f52257547c..1463b1e9f6db 100644 --- a/cluster-autoscaler/processors/provreq/processor.go +++ b/cluster-autoscaler/processors/provreq/processor.go @@ -32,7 +32,6 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/provisioningrequest/provreqwrapper" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" "k8s.io/autoscaler/cluster-autoscaler/simulator/scheduling" "k8s.io/autoscaler/cluster-autoscaler/utils/klogx" "k8s.io/klog/v2" @@ -58,8 +57,8 @@ type provReqProcessor struct { } // NewProvReqProcessor return ProvisioningRequestProcessor. 
-func NewProvReqProcessor(client *provreqclient.ProvisioningRequestClient, predicateChecker predicatechecker.PredicateChecker) *provReqProcessor { - return &provReqProcessor{now: time.Now, maxUpdated: defaultMaxUpdated, client: client, injector: scheduling.NewHintingSimulator(predicateChecker)} +func NewProvReqProcessor(client *provreqclient.ProvisioningRequestClient) *provReqProcessor { + return &provReqProcessor{now: time.Now, maxUpdated: defaultMaxUpdated, client: client, injector: scheduling.NewHintingSimulator()} } // Refresh implements loop.Observer interface and will be run at the start diff --git a/cluster-autoscaler/processors/provreq/processor_test.go b/cluster-autoscaler/processors/provreq/processor_test.go index 20eaa0e1ffba..11daf0aa2590 100644 --- a/cluster-autoscaler/processors/provreq/processor_test.go +++ b/cluster-autoscaler/processors/provreq/processor_test.go @@ -22,11 +22,9 @@ import ( "time" "github.com/stretchr/testify/assert" + apiv1 "k8s.io/api/core/v1" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" - "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" - v1 "k8s.io/autoscaler/cluster-autoscaler/apis/provisioningrequest/autoscaling.x-k8s.io/v1" "k8s.io/autoscaler/cluster-autoscaler/config" . 
"k8s.io/autoscaler/cluster-autoscaler/core/test" @@ -34,6 +32,7 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/provisioningrequest/provreqclient" "k8s.io/autoscaler/cluster-autoscaler/provisioningrequest/provreqwrapper" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/simulator/scheduling" ) @@ -239,8 +238,6 @@ func (f *fakeInjector) TrySchedulePods(clusterSnapshot clustersnapshot.ClusterSn } func TestBookCapacity(t *testing.T) { - schedulermetrics.Register() - testCases := []struct { name string conditions []string diff --git a/cluster-autoscaler/processors/test/common.go b/cluster-autoscaler/processors/test/common.go index dd45d6569f91..07f69c16a346 100644 --- a/cluster-autoscaler/processors/test/common.go +++ b/cluster-autoscaler/processors/test/common.go @@ -39,7 +39,7 @@ import ( // NewTestProcessors returns a set of simple processors for use in tests. func NewTestProcessors(context *context.AutoscalingContext) *processors.AutoscalingProcessors { return &processors.AutoscalingProcessors{ - PodListProcessor: podlistprocessor.NewDefaultPodListProcessor(context.PredicateChecker, scheduling.ScheduleAnywhere), + PodListProcessor: podlistprocessor.NewDefaultPodListProcessor(scheduling.ScheduleAnywhere), NodeGroupListProcessor: &nodegroups.NoOpNodeGroupListProcessor{}, BinpackingLimiter: binpacking.NewTimeLimiter(context.MaxNodeGroupBinpackingDuration), NodeGroupSetProcessor: nodegroupset.NewDefaultNodeGroupSetProcessor([]string{}, config.NodeGroupDifferenceRatios{}), diff --git a/cluster-autoscaler/provisioningrequest/orchestrator/orchestrator.go b/cluster-autoscaler/provisioningrequest/orchestrator/orchestrator.go index 4008b5992246..6174749c46d7 100644 --- a/cluster-autoscaler/provisioningrequest/orchestrator/orchestrator.go +++ b/cluster-autoscaler/provisioningrequest/orchestrator/orchestrator.go @@ -69,7 +69,7 @@ func (o *provReqOrchestrator) 
Initialize( ) { o.initialized = true o.context = autoscalingContext - o.injector = scheduling.NewHintingSimulator(autoscalingContext.PredicateChecker) + o.injector = scheduling.NewHintingSimulator() for _, mode := range o.provisioningClasses { mode.Initialize(autoscalingContext, processors, clusterStateRegistry, estimatorBuilder, taintConfig, o.injector) } diff --git a/cluster-autoscaler/provisioningrequest/orchestrator/orchestrator_test.go b/cluster-autoscaler/provisioningrequest/orchestrator/orchestrator_test.go index ba6a8e684a17..414cd43c16a7 100644 --- a/cluster-autoscaler/provisioningrequest/orchestrator/orchestrator_test.go +++ b/cluster-autoscaler/provisioningrequest/orchestrator/orchestrator_test.go @@ -49,13 +49,9 @@ import ( . "k8s.io/autoscaler/cluster-autoscaler/utils/test" "k8s.io/client-go/kubernetes/fake" clocktesting "k8s.io/utils/clock/testing" - - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" ) func TestScaleUp(t *testing.T) { - schedulermetrics.Register() - // Set up a cluster with 200 nodes: // - 100 nodes with high cpu, low memory in autoscaled group with max 150 // - 100 nodes with high memory, low cpu not in autoscaled group diff --git a/cluster-autoscaler/simulator/cluster.go b/cluster-autoscaler/simulator/cluster.go index e81d9ecea0ff..36fa10ff3be9 100644 --- a/cluster-autoscaler/simulator/cluster.go +++ b/cluster-autoscaler/simulator/cluster.go @@ -26,7 +26,6 @@ import ( "k8s.io/autoscaler/cluster-autoscaler/simulator/drainability/rules" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/autoscaler/cluster-autoscaler/simulator/options" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" "k8s.io/autoscaler/cluster-autoscaler/simulator/scheduling" "k8s.io/autoscaler/cluster-autoscaler/utils/drain" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" @@ -105,15 +104,14 @@ type RemovalSimulator struct { } // NewRemovalSimulator returns a new RemovalSimulator. 
-func NewRemovalSimulator(listers kube_util.ListerRegistry, clusterSnapshot clustersnapshot.ClusterSnapshot, predicateChecker predicatechecker.PredicateChecker, - deleteOptions options.NodeDeleteOptions, drainabilityRules rules.Rules, persistSuccessfulSimulations bool) *RemovalSimulator { +func NewRemovalSimulator(listers kube_util.ListerRegistry, clusterSnapshot clustersnapshot.ClusterSnapshot, deleteOptions options.NodeDeleteOptions, drainabilityRules rules.Rules, persistSuccessfulSimulations bool) *RemovalSimulator { return &RemovalSimulator{ listers: listers, clusterSnapshot: clusterSnapshot, canPersist: persistSuccessfulSimulations, deleteOptions: deleteOptions, drainabilityRules: drainabilityRules, - schedulingSimulator: scheduling.NewHintingSimulator(predicateChecker), + schedulingSimulator: scheduling.NewHintingSimulator(), } } @@ -223,7 +221,7 @@ func (r *RemovalSimulator) findPlaceFor(removedNode string, pods []*apiv1.Pod, n // remove pods from clusterSnapshot first for _, pod := range pods { - if err := r.clusterSnapshot.ForceRemovePod(pod.Namespace, pod.Name, removedNode); err != nil { + if err := r.clusterSnapshot.UnschedulePod(pod.Namespace, pod.Name, removedNode); err != nil { // just log error klog.Errorf("Simulating removal of %s/%s return error; %v", pod.Namespace, pod.Name, err) } diff --git a/cluster-autoscaler/simulator/cluster_test.go b/cluster-autoscaler/simulator/cluster_test.go index e493a6672b02..2fbf1f55973f 100644 --- a/cluster-autoscaler/simulator/cluster_test.go +++ b/cluster-autoscaler/simulator/cluster_test.go @@ -21,19 +21,18 @@ import ( "testing" "time" + "github.com/stretchr/testify/assert" + + appsv1 "k8s.io/api/apps/v1" + apiv1 "k8s.io/api/core/v1" + metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/testsnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" 
"k8s.io/autoscaler/cluster-autoscaler/simulator/options" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" "k8s.io/autoscaler/cluster-autoscaler/utils/drain" kube_util "k8s.io/autoscaler/cluster-autoscaler/utils/kubernetes" . "k8s.io/autoscaler/cluster-autoscaler/utils/test" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" - - "github.com/stretchr/testify/assert" - appsv1 "k8s.io/api/apps/v1" - apiv1 "k8s.io/api/core/v1" - metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" "k8s.io/kubernetes/pkg/kubelet/types" ) @@ -57,10 +56,10 @@ func TestFindEmptyNodes(t *testing.T) { types.ConfigMirrorAnnotationKey: "", } - clusterSnapshot := clustersnapshot.NewBasicClusterSnapshot() + clusterSnapshot := testsnapshot.NewTestSnapshotOrDie(t) clustersnapshot.InitializeClusterSnapshotOrDie(t, clusterSnapshot, []*apiv1.Node{nodes[0], nodes[1], nodes[2], nodes[3]}, []*apiv1.Pod{pod1, pod2}) testTime := time.Date(2020, time.December, 18, 17, 0, 0, 0, time.UTC) - r := NewRemovalSimulator(nil, clusterSnapshot, nil, testDeleteOptions(), nil, false) + r := NewRemovalSimulator(nil, clusterSnapshot, testDeleteOptions(), nil, false) emptyNodes := r.FindEmptyNodesToRemove(nodeNames, testTime) assert.Equal(t, []string{nodeNames[0], nodeNames[2], nodeNames[3]}, emptyNodes) } @@ -75,8 +74,6 @@ type findNodesToRemoveTestConfig struct { } func TestFindNodesToRemove(t *testing.T) { - schedulermetrics.Register() - emptyNode := BuildTestNode("n1", 1000, 2000000) // two small pods backed by ReplicaSet @@ -141,9 +138,7 @@ func TestFindNodesToRemove(t *testing.T) { PodsToReschedule: []*apiv1.Pod{pod1, pod2}, } - clusterSnapshot := clustersnapshot.NewBasicClusterSnapshot() - predicateChecker, err := predicatechecker.NewTestPredicateChecker() - assert.NoError(t, err) + clusterSnapshot := testsnapshot.NewTestSnapshotOrDie(t) tests := []findNodesToRemoveTestConfig{ { @@ -190,7 +185,7 @@ func TestFindNodesToRemove(t *testing.T) { destinations = append(destinations, node.Name) } 
clustersnapshot.InitializeClusterSnapshotOrDie(t, clusterSnapshot, test.allNodes, test.pods) - r := NewRemovalSimulator(registry, clusterSnapshot, predicateChecker, testDeleteOptions(), nil, false) + r := NewRemovalSimulator(registry, clusterSnapshot, testDeleteOptions(), nil, false) toRemove, unremovable := r.FindNodesToRemove(test.candidates, destinations, time.Now(), nil) fmt.Printf("Test scenario: %s, found len(toRemove)=%v, expected len(test.toRemove)=%v\n", test.name, len(toRemove), len(test.toRemove)) assert.Equal(t, test.toRemove, toRemove) diff --git a/cluster-autoscaler/simulator/clustersnapshot/basic.go b/cluster-autoscaler/simulator/clustersnapshot/base/basic.go similarity index 73% rename from cluster-autoscaler/simulator/clustersnapshot/basic.go rename to cluster-autoscaler/simulator/clustersnapshot/base/basic.go index be8388c5ce8b..2d0bdd036995 100644 --- a/cluster-autoscaler/simulator/clustersnapshot/basic.go +++ b/cluster-autoscaler/simulator/clustersnapshot/base/basic.go @@ -14,26 +14,28 @@ See the License for the specific language governing permissions and limitations under the License. */ -package clustersnapshot +package base import ( "fmt" apiv1 "k8s.io/api/core/v1" - "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" "k8s.io/klog/v2" schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" ) -// BasicClusterSnapshot is simple, reference implementation of ClusterSnapshot. +// BasicSnapshotBase is simple, reference implementation of SnapshotBase. // It is inefficient. But hopefully bug-free and good for initial testing. 
-type BasicClusterSnapshot struct { +type BasicSnapshotBase struct { data []*internalBasicSnapshotData } type internalBasicSnapshotData struct { nodeInfoMap map[string]*schedulerframework.NodeInfo pvcNamespacePodMap map[string]map[string]bool + draSnapshot drasnapshot.Snapshot } func (data *internalBasicSnapshotData) listNodeInfos() []*schedulerframework.NodeInfo { @@ -70,7 +72,7 @@ func (data *internalBasicSnapshotData) getNodeInfo(nodeName string) (*schedulerf if v, ok := data.nodeInfoMap[nodeName]; ok { return v, nil } - return nil, ErrNodeNotFound + return nil, clustersnapshot.ErrNodeNotFound } func (data *internalBasicSnapshotData) isPVCUsedByPods(key string) bool { @@ -140,6 +142,7 @@ func (data *internalBasicSnapshotData) clone() *internalBasicSnapshotData { return &internalBasicSnapshotData{ nodeInfoMap: clonedNodeInfoMap, pvcNamespacePodMap: clonedPvcNamespaceNodeMap, + draSnapshot: data.draSnapshot.Clone(), } } @@ -155,7 +158,7 @@ func (data *internalBasicSnapshotData) addNode(node *apiv1.Node) error { func (data *internalBasicSnapshotData) removeNodeInfo(nodeName string) error { if _, found := data.nodeInfoMap[nodeName]; !found { - return ErrNodeNotFound + return clustersnapshot.ErrNodeNotFound } for _, pod := range data.nodeInfoMap[nodeName].Pods { data.removePvcUsedByPod(pod.Pod) @@ -166,7 +169,7 @@ func (data *internalBasicSnapshotData) removeNodeInfo(nodeName string) error { func (data *internalBasicSnapshotData) addPod(pod *apiv1.Pod, nodeName string) error { if _, found := data.nodeInfoMap[nodeName]; !found { - return ErrNodeNotFound + return clustersnapshot.ErrNodeNotFound } data.nodeInfoMap[nodeName].AddPod(pod) data.addPvcUsedByPod(pod) @@ -176,7 +179,7 @@ func (data *internalBasicSnapshotData) addPod(pod *apiv1.Pod, nodeName string) e func (data *internalBasicSnapshotData) removePod(namespace, podName, nodeName string) error { nodeInfo, found := data.nodeInfoMap[nodeName] if !found { - return ErrNodeNotFound + return 
clustersnapshot.ErrNodeNotFound } logger := klog.Background() for _, podInfo := range nodeInfo.Pods { @@ -193,38 +196,28 @@ func (data *internalBasicSnapshotData) removePod(namespace, podName, nodeName st return fmt.Errorf("pod %s/%s not in snapshot", namespace, podName) } -// NewBasicClusterSnapshot creates instances of BasicClusterSnapshot. -func NewBasicClusterSnapshot() *BasicClusterSnapshot { - snapshot := &BasicClusterSnapshot{} +// NewBasicSnapshotBase creates instances of BasicSnapshotBase. +func NewBasicSnapshotBase() *BasicSnapshotBase { + snapshot := &BasicSnapshotBase{} snapshot.clear() return snapshot } -func (snapshot *BasicClusterSnapshot) getInternalData() *internalBasicSnapshotData { +func (snapshot *BasicSnapshotBase) getInternalData() *internalBasicSnapshotData { return snapshot.data[len(snapshot.data)-1] } -// GetNodeInfo gets a NodeInfo. -func (snapshot *BasicClusterSnapshot) GetNodeInfo(nodeName string) (*framework.NodeInfo, error) { - schedNodeInfo, err := snapshot.getInternalData().getNodeInfo(nodeName) - if err != nil { - return nil, err - } - return framework.WrapSchedulerNodeInfo(schedNodeInfo), nil -} - -// ListNodeInfos lists NodeInfos. -func (snapshot *BasicClusterSnapshot) ListNodeInfos() ([]*framework.NodeInfo, error) { - schedNodeInfos := snapshot.getInternalData().listNodeInfos() - return framework.WrapSchedulerNodeInfos(schedNodeInfos), nil +// DraSnapshot returns the DRA snapshot. +func (snapshot *BasicSnapshotBase) DraSnapshot() drasnapshot.Snapshot { + return snapshot.getInternalData().draSnapshot } -// AddNodeInfo adds a NodeInfo. -func (snapshot *BasicClusterSnapshot) AddNodeInfo(nodeInfo *framework.NodeInfo) error { +// AddSchedulerNodeInfo adds a NodeInfo. 
+func (snapshot *BasicSnapshotBase) AddSchedulerNodeInfo(nodeInfo *schedulerframework.NodeInfo) error { if err := snapshot.getInternalData().addNode(nodeInfo.Node()); err != nil { return err } - for _, podInfo := range nodeInfo.Pods() { + for _, podInfo := range nodeInfo.Pods { if err := snapshot.getInternalData().addPod(podInfo.Pod, nodeInfo.Node().Name); err != nil { return err } @@ -233,7 +226,7 @@ func (snapshot *BasicClusterSnapshot) AddNodeInfo(nodeInfo *framework.NodeInfo) } // SetClusterState sets the cluster state. -func (snapshot *BasicClusterSnapshot) SetClusterState(nodes []*apiv1.Node, scheduledPods []*apiv1.Pod) error { +func (snapshot *BasicSnapshotBase) SetClusterState(nodes []*apiv1.Node, scheduledPods []*apiv1.Pod, draSnapshot drasnapshot.Snapshot) error { snapshot.clear() knownNodes := make(map[string]bool) @@ -250,37 +243,38 @@ func (snapshot *BasicClusterSnapshot) SetClusterState(nodes []*apiv1.Node, sched } } } + snapshot.getInternalData().draSnapshot = draSnapshot return nil } -// RemoveNodeInfo removes nodes (and pods scheduled to it) from the snapshot. -func (snapshot *BasicClusterSnapshot) RemoveNodeInfo(nodeName string) error { +// RemoveSchedulerNodeInfo removes a node (and the pods scheduled to it) from the snapshot. +func (snapshot *BasicSnapshotBase) RemoveSchedulerNodeInfo(nodeName string) error { return snapshot.getInternalData().removeNodeInfo(nodeName) } // ForceAddPod adds pod to the snapshot and schedules it to given node. -func (snapshot *BasicClusterSnapshot) ForceAddPod(pod *apiv1.Pod, nodeName string) error { +func (snapshot *BasicSnapshotBase) ForceAddPod(pod *apiv1.Pod, nodeName string) error { return snapshot.getInternalData().addPod(pod, nodeName) } // ForceRemovePod removes pod from the snapshot. 
-func (snapshot *BasicClusterSnapshot) ForceRemovePod(namespace, podName, nodeName string) error { +func (snapshot *BasicSnapshotBase) ForceRemovePod(namespace, podName, nodeName string) error { return snapshot.getInternalData().removePod(namespace, podName, nodeName) } // IsPVCUsedByPods returns if the pvc is used by any pod -func (snapshot *BasicClusterSnapshot) IsPVCUsedByPods(key string) bool { +func (snapshot *BasicSnapshotBase) IsPVCUsedByPods(key string) bool { return snapshot.getInternalData().isPVCUsedByPods(key) } // Fork creates a fork of snapshot state. All modifications can later be reverted to moment of forking via Revert() -func (snapshot *BasicClusterSnapshot) Fork() { +func (snapshot *BasicSnapshotBase) Fork() { forkData := snapshot.getInternalData().clone() snapshot.data = append(snapshot.data, forkData) } // Revert reverts snapshot state to moment of forking. -func (snapshot *BasicClusterSnapshot) Revert() { +func (snapshot *BasicSnapshotBase) Revert() { if len(snapshot.data) == 1 { return } @@ -288,7 +282,7 @@ func (snapshot *BasicClusterSnapshot) Revert() { } // Commit commits changes done after forking. -func (snapshot *BasicClusterSnapshot) Commit() error { +func (snapshot *BasicSnapshotBase) Commit() error { if len(snapshot.data) <= 1 { // do nothing return nil @@ -298,47 +292,62 @@ func (snapshot *BasicClusterSnapshot) Commit() error { } // clear reset cluster snapshot to empty, unforked state -func (snapshot *BasicClusterSnapshot) clear() { +func (snapshot *BasicSnapshotBase) clear() { baseData := newInternalBasicSnapshotData() snapshot.data = []*internalBasicSnapshotData{baseData} } // implementation of SharedLister interface -type basicClusterSnapshotNodeLister BasicClusterSnapshot -type basicClusterSnapshotStorageLister BasicClusterSnapshot +type basicClusterSnapshotNodeLister BasicSnapshotBase +type basicClusterSnapshotStorageLister BasicSnapshotBase // NodeInfos exposes snapshot as NodeInfoLister. 
-func (snapshot *BasicClusterSnapshot) NodeInfos() schedulerframework.NodeInfoLister { +func (snapshot *BasicSnapshotBase) NodeInfos() schedulerframework.NodeInfoLister { return (*basicClusterSnapshotNodeLister)(snapshot) } // StorageInfos exposes snapshot as StorageInfoLister. -func (snapshot *BasicClusterSnapshot) StorageInfos() schedulerframework.StorageInfoLister { +func (snapshot *BasicSnapshotBase) StorageInfos() schedulerframework.StorageInfoLister { return (*basicClusterSnapshotStorageLister)(snapshot) } +// ResourceClaims exposes the snapshot as ResourceClaimTracker. +func (snapshot *BasicSnapshotBase) ResourceClaims() schedulerframework.ResourceClaimTracker { + return snapshot.DraSnapshot().ResourceClaims() +} + +// ResourceSlices exposes snapshot as ResourceSliceLister. +func (snapshot *BasicSnapshotBase) ResourceSlices() schedulerframework.ResourceSliceLister { + return snapshot.DraSnapshot().ResourceSlices() +} + +// DeviceClasses exposes the snapshot as DeviceClassLister. +func (snapshot *BasicSnapshotBase) DeviceClasses() schedulerframework.DeviceClassLister { + return snapshot.DraSnapshot().DeviceClasses() +} + // List returns the list of nodes in the snapshot. 
func (snapshot *basicClusterSnapshotNodeLister) List() ([]*schedulerframework.NodeInfo, error) { - return (*BasicClusterSnapshot)(snapshot).getInternalData().listNodeInfos(), nil + return (*BasicSnapshotBase)(snapshot).getInternalData().listNodeInfos(), nil } // HavePodsWithAffinityList returns the list of nodes with at least one pods with inter-pod affinity func (snapshot *basicClusterSnapshotNodeLister) HavePodsWithAffinityList() ([]*schedulerframework.NodeInfo, error) { - return (*BasicClusterSnapshot)(snapshot).getInternalData().listNodeInfosThatHavePodsWithAffinityList() + return (*BasicSnapshotBase)(snapshot).getInternalData().listNodeInfosThatHavePodsWithAffinityList() } // HavePodsWithRequiredAntiAffinityList returns the list of NodeInfos of nodes with pods with required anti-affinity terms. func (snapshot *basicClusterSnapshotNodeLister) HavePodsWithRequiredAntiAffinityList() ([]*schedulerframework.NodeInfo, error) { - return (*BasicClusterSnapshot)(snapshot).getInternalData().listNodeInfosThatHavePodsWithRequiredAntiAffinityList() + return (*BasicSnapshotBase)(snapshot).getInternalData().listNodeInfosThatHavePodsWithRequiredAntiAffinityList() } // Returns the NodeInfo of the given node name. func (snapshot *basicClusterSnapshotNodeLister) Get(nodeName string) (*schedulerframework.NodeInfo, error) { - return (*BasicClusterSnapshot)(snapshot).getInternalData().getNodeInfo(nodeName) + return (*BasicSnapshotBase)(snapshot).getInternalData().getNodeInfo(nodeName) } // Returns the IsPVCUsedByPods in a given key. 
func (snapshot *basicClusterSnapshotStorageLister) IsPVCUsedByPods(key string) bool { - return (*BasicClusterSnapshot)(snapshot).getInternalData().isPVCUsedByPods(key) + return (*BasicSnapshotBase)(snapshot).getInternalData().isPVCUsedByPods(key) } diff --git a/cluster-autoscaler/simulator/clustersnapshot/delta.go b/cluster-autoscaler/simulator/clustersnapshot/base/delta.go similarity index 81% rename from cluster-autoscaler/simulator/clustersnapshot/delta.go rename to cluster-autoscaler/simulator/clustersnapshot/base/delta.go index 869e494e0226..51ec83ba02eb 100644 --- a/cluster-autoscaler/simulator/clustersnapshot/delta.go +++ b/cluster-autoscaler/simulator/clustersnapshot/base/delta.go @@ -14,18 +14,19 @@ See the License for the specific language governing permissions and limitations under the License. */ -package clustersnapshot +package base import ( "fmt" apiv1 "k8s.io/api/core/v1" - "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" "k8s.io/klog/v2" schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" ) -// DeltaClusterSnapshot is an implementation of ClusterSnapshot optimized for typical Cluster Autoscaler usage - (fork, add stuff, revert), repeated many times per loop. +// DeltaSnapshotBase is an implementation of SnapshotBase optimized for typical Cluster Autoscaler usage - (fork, add stuff, revert), repeated many times per loop. // // Complexity of some notable operations: // @@ -42,12 +43,12 @@ import ( // (when forked affects delta, but not base.) // pod affinity - causes scheduler framework to list pods with non-empty selector, // so basic caching doesn't help. 
-type DeltaClusterSnapshot struct { +type DeltaSnapshotBase struct { data *internalDeltaSnapshotData } -type deltaSnapshotNodeLister DeltaClusterSnapshot -type deltaSnapshotStorageLister DeltaClusterSnapshot +type deltaSnapshotNodeLister DeltaSnapshotBase +type deltaSnapshotStorageLister DeltaSnapshotBase type internalDeltaSnapshotData struct { baseData *internalDeltaSnapshotData @@ -191,7 +192,7 @@ func (data *internalDeltaSnapshotData) removeNodeInfo(nodeName string) error { if _, deleted := data.deletedNodeInfos[nodeName]; deleted { // If node was deleted within this delta, fail with error. - return ErrNodeNotFound + return clustersnapshot.ErrNodeNotFound } _, foundInBase := data.baseData.getNodeInfo(nodeName) @@ -202,7 +203,7 @@ func (data *internalDeltaSnapshotData) removeNodeInfo(nodeName string) error { if !foundInBase && !foundInDelta { // Node not found in the chain. - return ErrNodeNotFound + return clustersnapshot.ErrNodeNotFound } // Maybe consider deleting from the lists instead. Maybe not. @@ -230,7 +231,7 @@ func (data *internalDeltaSnapshotData) nodeInfoToModify(nodeName string) (*sched func (data *internalDeltaSnapshotData) addPod(pod *apiv1.Pod, nodeName string) error { ni, found := data.nodeInfoToModify(nodeName) if !found { - return ErrNodeNotFound + return clustersnapshot.ErrNodeNotFound } ni.AddPod(pod) @@ -246,7 +247,7 @@ func (data *internalDeltaSnapshotData) removePod(namespace, name, nodeName strin // probably means things are very bad anyway. ni, found := data.nodeInfoToModify(nodeName) if !found { - return ErrNodeNotFound + return clustersnapshot.ErrNodeNotFound } podFound := false @@ -359,61 +360,68 @@ func (snapshot *deltaSnapshotNodeLister) HavePodsWithRequiredAntiAffinityList() // Get returns node info by node name. 
func (snapshot *deltaSnapshotNodeLister) Get(nodeName string) (*schedulerframework.NodeInfo, error) { - return (*DeltaClusterSnapshot)(snapshot).getNodeInfo(nodeName) + return (*DeltaSnapshotBase)(snapshot).getNodeInfo(nodeName) } // IsPVCUsedByPods returns if PVC is used by pods func (snapshot *deltaSnapshotStorageLister) IsPVCUsedByPods(key string) bool { - return (*DeltaClusterSnapshot)(snapshot).IsPVCUsedByPods(key) + return (*DeltaSnapshotBase)(snapshot).IsPVCUsedByPods(key) } -func (snapshot *DeltaClusterSnapshot) getNodeInfo(nodeName string) (*schedulerframework.NodeInfo, error) { +func (snapshot *DeltaSnapshotBase) getNodeInfo(nodeName string) (*schedulerframework.NodeInfo, error) { data := snapshot.data node, found := data.getNodeInfo(nodeName) if !found { - return nil, ErrNodeNotFound + return nil, clustersnapshot.ErrNodeNotFound } return node, nil } // NodeInfos returns node lister. -func (snapshot *DeltaClusterSnapshot) NodeInfos() schedulerframework.NodeInfoLister { +func (snapshot *DeltaSnapshotBase) NodeInfos() schedulerframework.NodeInfoLister { return (*deltaSnapshotNodeLister)(snapshot) } // StorageInfos returns storage lister -func (snapshot *DeltaClusterSnapshot) StorageInfos() schedulerframework.StorageInfoLister { +func (snapshot *DeltaSnapshotBase) StorageInfos() schedulerframework.StorageInfoLister { return (*deltaSnapshotStorageLister)(snapshot) } -// NewDeltaClusterSnapshot creates instances of DeltaClusterSnapshot. -func NewDeltaClusterSnapshot() *DeltaClusterSnapshot { - snapshot := &DeltaClusterSnapshot{} - snapshot.clear() - return snapshot +// ResourceClaims exposes snapshot as ResourceClaimTracker +func (snapshot *DeltaSnapshotBase) ResourceClaims() schedulerframework.ResourceClaimTracker { + return snapshot.DraSnapshot().ResourceClaims() + } -// GetNodeInfo gets a NodeInfo. 
-func (snapshot *DeltaClusterSnapshot) GetNodeInfo(nodeName string) (*framework.NodeInfo, error) { - schedNodeInfo, err := snapshot.getNodeInfo(nodeName) - if err != nil { - return nil, err - } - return framework.WrapSchedulerNodeInfo(schedNodeInfo), nil +// ResourceSlices exposes snapshot as ResourceSliceLister. +func (snapshot *DeltaSnapshotBase) ResourceSlices() schedulerframework.ResourceSliceLister { + return snapshot.DraSnapshot().ResourceSlices() +} + +// DeviceClasses exposes the snapshot as DeviceClassLister. +func (snapshot *DeltaSnapshotBase) DeviceClasses() schedulerframework.DeviceClassLister { + return snapshot.DraSnapshot().DeviceClasses() +} + +// NewDeltaSnapshotBase creates instances of DeltaSnapshotBase. +func NewDeltaSnapshotBase() *DeltaSnapshotBase { + snapshot := &DeltaSnapshotBase{} + snapshot.clear() + return snapshot } -// ListNodeInfos lists NodeInfos. -func (snapshot *DeltaClusterSnapshot) ListNodeInfos() ([]*framework.NodeInfo, error) { - schedNodeInfos := snapshot.data.getNodeInfoList() - return framework.WrapSchedulerNodeInfos(schedNodeInfos), nil +// DraSnapshot returns the DRA snapshot. +func (snapshot *DeltaSnapshotBase) DraSnapshot() drasnapshot.Snapshot { + // TODO(DRA): Return DRA snapshot. + return drasnapshot.Snapshot{} } -// AddNodeInfo adds a NodeInfo. -func (snapshot *DeltaClusterSnapshot) AddNodeInfo(nodeInfo *framework.NodeInfo) error { +// AddSchedulerNodeInfo adds a NodeInfo. +func (snapshot *DeltaSnapshotBase) AddSchedulerNodeInfo(nodeInfo *schedulerframework.NodeInfo) error { if err := snapshot.data.addNode(nodeInfo.Node()); err != nil { return err } - for _, podInfo := range nodeInfo.Pods() { + for _, podInfo := range nodeInfo.Pods { if err := snapshot.data.addPod(podInfo.Pod, nodeInfo.Node().Name); err != nil { return err } @@ -422,7 +430,7 @@ func (snapshot *DeltaClusterSnapshot) AddNodeInfo(nodeInfo *framework.NodeInfo) } // SetClusterState sets the cluster state. 
-func (snapshot *DeltaClusterSnapshot) SetClusterState(nodes []*apiv1.Node, scheduledPods []*apiv1.Pod) error { +func (snapshot *DeltaSnapshotBase) SetClusterState(nodes []*apiv1.Node, scheduledPods []*apiv1.Pod, draSnapshot drasnapshot.Snapshot) error { snapshot.clear() knownNodes := make(map[string]bool) @@ -439,38 +447,39 @@ func (snapshot *DeltaClusterSnapshot) SetClusterState(nodes []*apiv1.Node, sched } } } + // TODO(DRA): Save DRA snapshot. return nil } -// RemoveNodeInfo removes nodes (and pods scheduled to it) from the snapshot. -func (snapshot *DeltaClusterSnapshot) RemoveNodeInfo(nodeName string) error { +// RemoveSchedulerNodeInfo removes nodes (and pods scheduled to it) from the snapshot. +func (snapshot *DeltaSnapshotBase) RemoveSchedulerNodeInfo(nodeName string) error { return snapshot.data.removeNodeInfo(nodeName) } // ForceAddPod adds pod to the snapshot and schedules it to given node. -func (snapshot *DeltaClusterSnapshot) ForceAddPod(pod *apiv1.Pod, nodeName string) error { +func (snapshot *DeltaSnapshotBase) ForceAddPod(pod *apiv1.Pod, nodeName string) error { return snapshot.data.addPod(pod, nodeName) } // ForceRemovePod removes pod from the snapshot. -func (snapshot *DeltaClusterSnapshot) ForceRemovePod(namespace, podName, nodeName string) error { +func (snapshot *DeltaSnapshotBase) ForceRemovePod(namespace, podName, nodeName string) error { return snapshot.data.removePod(namespace, podName, nodeName) } // IsPVCUsedByPods returns if the pvc is used by any pod -func (snapshot *DeltaClusterSnapshot) IsPVCUsedByPods(key string) bool { +func (snapshot *DeltaSnapshotBase) IsPVCUsedByPods(key string) bool { return snapshot.data.isPVCUsedByPods(key) } // Fork creates a fork of snapshot state. 
All modifications can later be reverted to moment of forking via Revert() // Time: O(1) -func (snapshot *DeltaClusterSnapshot) Fork() { +func (snapshot *DeltaSnapshotBase) Fork() { snapshot.data = snapshot.data.fork() } // Revert reverts snapshot state to moment of forking. // Time: O(1) -func (snapshot *DeltaClusterSnapshot) Revert() { +func (snapshot *DeltaSnapshotBase) Revert() { if snapshot.data.baseData != nil { snapshot.data = snapshot.data.baseData } @@ -478,7 +487,7 @@ func (snapshot *DeltaClusterSnapshot) Revert() { // Commit commits changes done after forking. // Time: O(n), where n = size of delta (number of nodes added, modified or deleted since forking) -func (snapshot *DeltaClusterSnapshot) Commit() error { +func (snapshot *DeltaSnapshotBase) Commit() error { newData, err := snapshot.data.commit() if err != nil { return err @@ -489,6 +498,6 @@ func (snapshot *DeltaClusterSnapshot) Commit() error { // Clear reset cluster snapshot to empty, unforked state // Time: O(1) -func (snapshot *DeltaClusterSnapshot) clear() { +func (snapshot *DeltaSnapshotBase) clear() { snapshot.data = newInternalDeltaSnapshotData() } diff --git a/cluster-autoscaler/simulator/clustersnapshot/base/delta_benchmark_test.go b/cluster-autoscaler/simulator/clustersnapshot/base/delta_benchmark_test.go new file mode 100644 index 000000000000..915a7a6cfcf8 --- /dev/null +++ b/cluster-autoscaler/simulator/clustersnapshot/base/delta_benchmark_test.go @@ -0,0 +1,88 @@ +/* +Copyright 2024 The Kubernetes Authors. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+See the License for the specific language governing permissions and +limitations under the License. +*/ + +package base + +import ( + "fmt" + "testing" + + "github.com/stretchr/testify/assert" + + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" + schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" +) + +func BenchmarkBuildNodeInfoList(b *testing.B) { + testCases := []struct { + nodeCount int + }{ + { + nodeCount: 1000, + }, + { + nodeCount: 5000, + }, + { + nodeCount: 15000, + }, + { + nodeCount: 100000, + }, + } + + for _, tc := range testCases { + b.Run(fmt.Sprintf("fork add 1000 to %d", tc.nodeCount), func(b *testing.B) { + nodes := clustersnapshot.CreateTestNodes(tc.nodeCount + 1000) + clusterSnapshot := NewDeltaSnapshotBase() + if err := clusterSnapshot.SetClusterState(nodes[:tc.nodeCount], nil, drasnapshot.Snapshot{}); err != nil { + assert.NoError(b, err) + } + clusterSnapshot.Fork() + for _, node := range nodes[tc.nodeCount:] { + schedNodeInfo := schedulerframework.NewNodeInfo() + schedNodeInfo.SetNode(node) + if err := clusterSnapshot.AddSchedulerNodeInfo(schedNodeInfo); err != nil { + assert.NoError(b, err) + } + } + b.ResetTimer() + for i := 0; i < b.N; i++ { + list := clusterSnapshot.data.buildNodeInfoList() + if len(list) != tc.nodeCount+1000 { + assert.Equal(b, len(list), tc.nodeCount+1000) + } + } + }) + } + for _, tc := range testCases { + b.Run(fmt.Sprintf("base %d", tc.nodeCount), func(b *testing.B) { + nodes := clustersnapshot.CreateTestNodes(tc.nodeCount) + clusterSnapshot := NewDeltaSnapshotBase() + if err := clusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}); err != nil { + assert.NoError(b, err) + } + b.ResetTimer() + for i := 0; i < b.N; i++ { + list := clusterSnapshot.data.buildNodeInfoList() + if len(list) != tc.nodeCount { + assert.Equal(b, len(list), tc.nodeCount) + } + } + }) + } +} diff --git 
a/cluster-autoscaler/simulator/clustersnapshot/clustersnapshot.go b/cluster-autoscaler/simulator/clustersnapshot/clustersnapshot.go index 1c60fcc0b730..2f61d1f594f5 100644 --- a/cluster-autoscaler/simulator/clustersnapshot/clustersnapshot.go +++ b/cluster-autoscaler/simulator/clustersnapshot/clustersnapshot.go @@ -20,6 +20,7 @@ import ( "errors" apiv1 "k8s.io/api/core/v1" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/klog/v2" schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" @@ -28,19 +29,10 @@ import ( // ClusterSnapshot is abstraction of cluster state used for predicate simulations. // It exposes mutation methods and can be viewed as scheduler's SharedLister. type ClusterSnapshot interface { - schedulerframework.SharedLister + SnapshotBase - // SetClusterState resets the snapshot to an unforked state and replaces the contents of the snapshot - // with the provided data. scheduledPods are correlated to their Nodes based on spec.NodeName. - SetClusterState(nodes []*apiv1.Node, scheduledPods []*apiv1.Pod) error - - // ForceAddPod adds the given Pod to the Node with the given nodeName inside the snapshot. - ForceAddPod(pod *apiv1.Pod, nodeName string) error - // ForceRemovePod removes the given Pod (and all DRA objects it owns) from the snapshot. - ForceRemovePod(namespace string, podName string, nodeName string) error - - // AddNodeInfo adds the given NodeInfo to the snapshot. The Node and the Pods are added, as well as - // any DRA objects passed along them. + // AddNodeInfo adds the given NodeInfo to the snapshot without checking scheduler predicates. The Node and the Pods are added, + // as well as any DRA objects passed along them. AddNodeInfo(nodeInfo *framework.NodeInfo) error // RemoveNodeInfo removes the given NodeInfo from the snapshot The Node and the Pods are removed, as well as // any DRA objects owned by them. 
@@ -52,6 +44,53 @@ type ClusterSnapshot interface { // ListNodeInfos returns internal NodeInfos for all Nodes tracked in the snapshot. See the comment on GetNodeInfo. ListNodeInfos() ([]*framework.NodeInfo, error) + // SchedulePod tries to schedule the given Pod on the Node with the given name inside the snapshot, + // checking scheduling predicates. The pod is only scheduled if the predicates pass. If the pod is scheduled, + // all relevant DRA objects are modified to reflect that. Returns nil if the pod got scheduled, and a non-nil + // error explaining why not otherwise. The error type can be checked to distinguish failing predicates + // from unexpected errors. + SchedulePod(pod *apiv1.Pod, nodeName string) SchedulingError + // SchedulePodOnAnyNodeMatching tries to schedule the given Pod on any Node for which nodeMatches returns + // true. Scheduling predicates are checked, and the pod is scheduled only if there is a matching Node with passing + // predicates. If the pod is scheduled, all relevant DRA objects are modified to reflect that, and the name of the + // Node its scheduled on and nil are returned. If the pod can't be scheduled on any Node, an empty string and a non-nil + // error explaining why are returned. The error type can be checked to distinguish failing predicates from unexpected errors. + SchedulePodOnAnyNodeMatching(pod *apiv1.Pod, nodeMatches func(*framework.NodeInfo) bool) (matchingNode string, err SchedulingError) + // UnschedulePod removes the given Pod from the given Node inside the snapshot, and modifies all relevant DRA objects + // to reflect the removal. The pod can then be scheduled on another Node in the snapshot using the Schedule methods. + UnschedulePod(namespace string, podName string, nodeName string) error + + // CheckPredicates runs scheduler predicates to check if the given Pod would be able to schedule on the Node with the given + // name. 
Returns nil if predicates pass, or a non-nil error specifying why they didn't otherwise. The error type can be checked + // to distinguish failing predicates from unexpected errors. Doesn't mutate the snapshot. + CheckPredicates(pod *apiv1.Pod, nodeName string) SchedulingError +} + +// SnapshotBase is the "low-level" part of ClusterSnapshot. Mutation methods modify the snapshot state directly, without going +// through scheduler predicates. +type SnapshotBase interface { + framework.SharedLister + + // SetClusterState resets the snapshot to an unforked state and replaces the contents of the snapshot + // with the provided data. scheduledPods are correlated to their Nodes based on spec.NodeName. + SetClusterState(nodes []*apiv1.Node, scheduledPods []*apiv1.Pod, draSnapshot drasnapshot.Snapshot) error + + // ForceAddPod adds the given Pod to the Node with the given nodeName inside the snapshot. + ForceAddPod(pod *apiv1.Pod, nodeName string) error + // ForceRemovePod removes the given Pod (and all DRA objects it owns) from the snapshot. + ForceRemovePod(namespace string, podName string, nodeName string) error + + // AddSchedulerNodeInfo adds the given schedulerframework.NodeInfo to the snapshot without checking scheduler predicates, and + // without taking DRA objects into account. This shouldn't be used outside the clustersnapshot pkg, use ClusterSnapshot.AddNodeInfo() + // instead. + AddSchedulerNodeInfo(nodeInfo *schedulerframework.NodeInfo) error + // RemoveSchedulerNodeInfo removes the given schedulerframework.NodeInfo from the snapshot without taking DRA objects into account. This shouldn't + // be used outside the clustersnapshot pkg, use ClusterSnapshot.RemoveNodeInfo() instead. + RemoveSchedulerNodeInfo(nodeName string) error + + // DraSnapshot returns an interface that allows accessing and modifying the DRA objects in the snapshot. + DraSnapshot() drasnapshot.Snapshot + // Fork creates a fork of snapshot state. 
All modifications can later be reverted to moment of forking via Revert(). // Use WithForkedSnapshot() helper function instead if possible. Fork() diff --git a/cluster-autoscaler/simulator/clustersnapshot/error.go b/cluster-autoscaler/simulator/clustersnapshot/error.go new file mode 100644 index 000000000000..87b988c5bf6c --- /dev/null +++ b/cluster-autoscaler/simulator/clustersnapshot/error.go @@ -0,0 +1,149 @@ +/* +Copyright 2019 The Kubernetes Authors. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +*/ + +package clustersnapshot + +import ( + "fmt" + "strings" + + apiv1 "k8s.io/api/core/v1" +) + +// SchedulingErrorType represents different possible schedulingError types. +type SchedulingErrorType int + +const ( + // SchedulingInternalError denotes internal unexpected error while trying to schedule a pod + SchedulingInternalError SchedulingErrorType = iota + // FailingPredicateError means that a pod couldn't be scheduled on a particular node because of a failing scheduler predicate + FailingPredicateError + // NoNodesPassingPredicatesFoundError means that a pod couldn't be scheduled on any Node because of failing scheduler predicates + NoNodesPassingPredicatesFoundError +) + +// SchedulingError represents an error encountered while trying to schedule a Pod inside ClusterSnapshot. +// An interface is exported instead of the concrete type to avoid the dreaded https://go.dev/doc/faq#nil_error. 
+type SchedulingError interface {
+	error
+
+	// Type can be used to distinguish between different SchedulingError types.
+	Type() SchedulingErrorType
+	// Reasons provides a list of human-readable reasons explaining the error.
+	Reasons() []string
+
+	// FailingPredicateName returns the name of the predicate that failed. Only applicable to the FailingPredicateError type.
+	FailingPredicateName() string
+	// FailingPredicateReasons returns a list of human-readable reasons explaining why the predicate failed. Only applicable to the FailingPredicateError type.
+	FailingPredicateReasons() []string
+}
+
+type schedulingError struct {
+	errorType SchedulingErrorType
+	pod       *apiv1.Pod
+
+	// Only applicable to SchedulingInternalError:
+	internalErrorMsg string
+
+	// Only applicable to FailingPredicateError:
+	failingPredicateName             string
+	failingPredicateReasons          []string
+	failingPredicateUnexpectedErrMsg string
+	// failingPredicateDebugInfo contains additional info that the predicate doesn't include,
+	// but which may be useful for debugging (e.g. taints on node blocking scale-up).
+	failingPredicateDebugInfo string
+}
+
+// Type returns the SchedulingErrorType of the error, i.e. whether it is an internal error or a predicate failure.
+func (se *schedulingError) Type() SchedulingErrorType {
+	return se.errorType
+}
+
+// Error satisfies the builtin error interface.
+func (se *schedulingError) Error() string {
+	msg := ""
+
+	switch se.errorType {
+	case SchedulingInternalError:
+		msg = fmt.Sprintf("unexpected error: %s", se.internalErrorMsg)
+	case FailingPredicateError:
+		details := []string{
+			fmt.Sprintf("predicateReasons=[%s]", strings.Join(se.FailingPredicateReasons(), ", ")),
+		}
+		if se.failingPredicateDebugInfo != "" {
+			details = append(details, fmt.Sprintf("debugInfo=%s", se.failingPredicateDebugInfo))
+		}
+		if se.failingPredicateUnexpectedErrMsg != "" {
+			details = append(details, fmt.Sprintf("unexpectedError=%s", se.failingPredicateUnexpectedErrMsg))
+		}
+		msg = fmt.Sprintf("predicate %q didn't pass (%s)", se.FailingPredicateName(), strings.Join(details, "; "))
+	case NoNodesPassingPredicatesFoundError:
+		msg = "couldn't find a matching Node with passing predicates"
+	default:
+		msg = fmt.Sprintf("SchedulingErrorType type %d unknown - this shouldn't happen", se.errorType) // %d: the type is an int, %q would print it as a rune literal.
+	}
+
+	return fmt.Sprintf("can't schedule pod %s/%s: %s", se.pod.Namespace, se.pod.Name, msg)
+}
+
+// Reasons returns a list of human-readable reasons for the error.
+func (se *schedulingError) Reasons() []string {
+	switch se.errorType {
+	case FailingPredicateError:
+		return se.FailingPredicateReasons()
+	default:
+		return []string{se.Error()}
+	}
+}
+
+// FailingPredicateName returns the name of the predicate which failed.
+func (se *schedulingError) FailingPredicateName() string {
+	return se.failingPredicateName
+}
+
+// FailingPredicateReasons returns the failure reasons from the failed predicate as a slice of strings.
+func (se *schedulingError) FailingPredicateReasons() []string {
+	return se.failingPredicateReasons
+}
+
+// NewSchedulingInternalError creates a new schedulingError with SchedulingInternalError type.
+func NewSchedulingInternalError(pod *apiv1.Pod, errMsg string) SchedulingError { + return &schedulingError{ + errorType: SchedulingInternalError, + pod: pod, + internalErrorMsg: errMsg, + } +} + +// NewFailingPredicateError creates a new schedulingError with FailingPredicateError type. +func NewFailingPredicateError(pod *apiv1.Pod, predicateName string, predicateReasons []string, unexpectedErrMsg string, debugInfo string) SchedulingError { + return &schedulingError{ + errorType: FailingPredicateError, + pod: pod, + failingPredicateName: predicateName, + failingPredicateReasons: predicateReasons, + failingPredicateUnexpectedErrMsg: unexpectedErrMsg, + failingPredicateDebugInfo: debugInfo, + } +} + +// NewNoNodesPassingPredicatesFoundError creates a new schedulingError with NoNodesPassingPredicatesFoundError type. +func NewNoNodesPassingPredicatesFoundError(pod *apiv1.Pod) SchedulingError { + return &schedulingError{ + errorType: NoNodesPassingPredicatesFoundError, + pod: pod, + } +} diff --git a/cluster-autoscaler/simulator/clustersnapshot/predicate/plugin_runner.go b/cluster-autoscaler/simulator/clustersnapshot/predicate/plugin_runner.go new file mode 100644 index 000000000000..b7b30e989959 --- /dev/null +++ b/cluster-autoscaler/simulator/clustersnapshot/predicate/plugin_runner.go @@ -0,0 +1,138 @@ +/* +Copyright 2016 The Kubernetes Authors. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. 
+*/ + +package predicate + +import ( + "context" + "fmt" + "strings" + + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" + + apiv1 "k8s.io/api/core/v1" + schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" +) + +// SchedulerPluginRunner can be used to run various phases of scheduler plugins through the scheduler framework. +type SchedulerPluginRunner struct { + fwHandle *framework.Handle + snapshot clustersnapshot.ClusterSnapshot + lastIndex int +} + +// NewSchedulerPluginRunner builds a SchedulerPluginRunner. +func NewSchedulerPluginRunner(fwHandle *framework.Handle, snapshot clustersnapshot.ClusterSnapshot) *SchedulerPluginRunner { + return &SchedulerPluginRunner{fwHandle: fwHandle, snapshot: snapshot} +} + +// RunFiltersUntilPassingNode runs the scheduler framework PreFilter phase once, and then keeps running the Filter phase for all nodes in the cluster that match the provided +// function - until a Node where the filters pass is found. Filters are only run for matching Nodes. If no matching node with passing filters is found, an error is returned. +// +// The node iteration always starts from the next Node from the last Node that was found by this method. TODO: Extract the iteration strategy out of SchedulerPluginRunner. 
+func (p *SchedulerPluginRunner) RunFiltersUntilPassingNode(pod *apiv1.Pod, nodeMatches func(*framework.NodeInfo) bool) (*apiv1.Node, *schedulerframework.CycleState, clustersnapshot.SchedulingError) {
+	nodeInfosList, err := p.snapshot.ListNodeInfos()
+	if err != nil {
+		return nil, nil, clustersnapshot.NewSchedulingInternalError(pod, fmt.Sprintf("error listing NodeInfos: %v", err))
+	}
+
+	p.fwHandle.DelegatingLister.UpdateDelegate(p.snapshot)
+	defer p.fwHandle.DelegatingLister.ResetDelegate()
+
+	state := schedulerframework.NewCycleState()
+	preFilterResult, preFilterStatus, _ := p.fwHandle.Framework.RunPreFilterPlugins(context.TODO(), state, pod)
+	if !preFilterStatus.IsSuccess() {
+		return nil, nil, clustersnapshot.NewFailingPredicateError(pod, preFilterStatus.Plugin(), preFilterStatus.Reasons(), "PreFilter failed", "")
+	}
+
+	for i := range nodeInfosList {
+		nodeInfo := nodeInfosList[(p.lastIndex+i)%len(nodeInfosList)] // Iterate starting at lastIndex, wrapping around the list.
+		if !nodeMatches(nodeInfo) {
+			continue
+		}
+
+		if !preFilterResult.AllNodes() && !preFilterResult.NodeNames.Has(nodeInfo.Node().Name) {
+			continue
+		}
+
+		// Be sure that the node is schedulable.
+		if nodeInfo.Node().Spec.Unschedulable {
+			continue
+		}
+
+		filterStatus := p.fwHandle.Framework.RunFilterPlugins(context.TODO(), state, pod, nodeInfo.ToScheduler())
+		if filterStatus.IsSuccess() {
+			p.lastIndex = (p.lastIndex + i + 1) % len(nodeInfosList) // The next call starts right after the Node found here.
+			return nodeInfo.Node(), state, nil
+		}
+	}
+	return nil, nil, clustersnapshot.NewNoNodesPassingPredicatesFoundError(pod)
+}
+
+// RunFiltersOnNode runs the scheduler framework PreFilter and Filter phases to check if the given pod can be scheduled on the given node.
+func (p *SchedulerPluginRunner) RunFiltersOnNode(pod *apiv1.Pod, nodeName string) (*apiv1.Node, *schedulerframework.CycleState, clustersnapshot.SchedulingError) { + nodeInfo, err := p.snapshot.GetNodeInfo(nodeName) + if err != nil { + return nil, nil, clustersnapshot.NewSchedulingInternalError(pod, fmt.Sprintf("error obtaining NodeInfo for name %q: %v", nodeName, err)) + } + + p.fwHandle.DelegatingLister.UpdateDelegate(p.snapshot) + defer p.fwHandle.DelegatingLister.ResetDelegate() + + state := schedulerframework.NewCycleState() + _, preFilterStatus, _ := p.fwHandle.Framework.RunPreFilterPlugins(context.TODO(), state, pod) + if !preFilterStatus.IsSuccess() { + return nil, nil, clustersnapshot.NewFailingPredicateError(pod, preFilterStatus.Plugin(), preFilterStatus.Reasons(), "PreFilter failed", "") + } + + filterStatus := p.fwHandle.Framework.RunFilterPlugins(context.TODO(), state, pod, nodeInfo.ToScheduler()) + + if !filterStatus.IsSuccess() { + filterName := filterStatus.Plugin() + filterReasons := filterStatus.Reasons() + unexpectedErrMsg := "" + if !filterStatus.IsRejected() { + unexpectedErrMsg = fmt.Sprintf("unexpected filter status %q", filterStatus.Code().String()) + } + return nil, nil, clustersnapshot.NewFailingPredicateError(pod, filterName, filterReasons, unexpectedErrMsg, p.failingFilterDebugInfo(filterName, nodeInfo)) + } + + return nodeInfo.Node(), state, nil +} + +// RunReserveOnNode runs the scheduler framework Reserve phase to update the scheduler plugins state to reflect the Pod being scheduled on the Node. 
+func (p *SchedulerPluginRunner) RunReserveOnNode(pod *apiv1.Pod, nodeName string, postFilterState *schedulerframework.CycleState) error { + p.fwHandle.DelegatingLister.UpdateDelegate(p.snapshot) + defer p.fwHandle.DelegatingLister.ResetDelegate() + + status := p.fwHandle.Framework.RunReservePluginsReserve(context.Background(), postFilterState, pod, nodeName) + if !status.IsSuccess() { + return fmt.Errorf("couldn't reserve node %s for pod %s/%s: %v", nodeName, pod.Namespace, pod.Name, status.Message()) + } + return nil +} + +func (p *SchedulerPluginRunner) failingFilterDebugInfo(filterName string, nodeInfo *framework.NodeInfo) string { + infoParts := []string{fmt.Sprintf("nodeName: %q", nodeInfo.Node().Name)} + + switch filterName { + case "TaintToleration": + infoParts = append(infoParts, fmt.Sprintf("nodeTaints: %#v", nodeInfo.Node().Spec.Taints)) + } + + return strings.Join(infoParts, ", ") +} diff --git a/cluster-autoscaler/simulator/clustersnapshot/predicate/plugin_runner_test.go b/cluster-autoscaler/simulator/clustersnapshot/predicate/plugin_runner_test.go new file mode 100644 index 000000000000..c1d345c9e54b --- /dev/null +++ b/cluster-autoscaler/simulator/clustersnapshot/predicate/plugin_runner_test.go @@ -0,0 +1,337 @@ +/* +Copyright 2020 The Kubernetes Authors. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. 
+*/
+
+package predicate
+
+import (
+	"os"
+	"path/filepath"
+	"testing"
+	"time"
+
+	"github.com/stretchr/testify/assert"
+
+	"k8s.io/client-go/informers"
+	clientsetfake "k8s.io/client-go/kubernetes/fake"
+	"k8s.io/kubernetes/pkg/scheduler/apis/config"
+	scheduler_config_latest "k8s.io/kubernetes/pkg/scheduler/apis/config/latest"
+
+	testconfig "k8s.io/autoscaler/cluster-autoscaler/config/test"
+	"k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot"
+	"k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/base"
+	"k8s.io/autoscaler/cluster-autoscaler/simulator/framework"
+	"k8s.io/autoscaler/cluster-autoscaler/utils/scheduler"
+	. "k8s.io/autoscaler/cluster-autoscaler/utils/test"
+
+	apiv1 "k8s.io/api/core/v1"
+)
+
+// loadTestSchedulerConfig writes the given scheduler configuration into a per-test temporary
+// directory and parses it back. The test fails immediately if the file cannot be written or
+// parsed, so a broken custom config can never silently fall back to the default one.
+func loadTestSchedulerConfig(t *testing.T, contents []byte) *config.KubeSchedulerConfiguration {
+	t.Helper()
+	// t.TempDir() is cleaned up automatically when the test finishes.
+	configFile := filepath.Join(t.TempDir(), "custom_config.yaml")
+	if err := os.WriteFile(configFile, contents, os.FileMode(0600)); err != nil {
+		t.Fatal(err)
+	}
+	cfg, err := scheduler.ConfigFromPath(configFile)
+	if err != nil {
+		t.Fatal(err)
+	}
+	return cfg
+}
+
+// TestRunFiltersOnNode checks RunFiltersOnNode against a single node, both with the default scheduler
+// config and with a custom config built from testconfig.SchedulerConfigNodeResourcesFitDisabled.
+func TestRunFiltersOnNode(t *testing.T) {
+	p450 := BuildTestPod("p450", 450, 500000)
+	p600 := BuildTestPod("p600", 600, 500000)
+	p8000 := BuildTestPod("p8000", 8000, 0)
+	p500 := BuildTestPod("p500", 500, 500000)
+
+	n1000 := BuildTestNode("n1000", 1000, 2000000)
+	SetNodeReadyState(n1000, true, time.Time{})
+
+	customConfig := loadTestSchedulerConfig(t, []byte(testconfig.SchedulerConfigNodeResourcesFitDisabled))
+
+	tests := []struct {
+		name          string
+		customConfig  *config.KubeSchedulerConfiguration
+		node          *apiv1.Node
+		scheduledPods []*apiv1.Pod
+		testPod       *apiv1.Pod
+		expectError   bool
+	}{
+		// default predicate checker test cases
+		{
+			name:          "default - other pod - insufficient cpu",
+			node:          n1000,
+			scheduledPods: []*apiv1.Pod{p450},
+			testPod:       p600,
+			expectError:   true,
+		},
+		{
+			name:          "default - other pod - ok",
+			node:          n1000,
+			scheduledPods: []*apiv1.Pod{p450},
+			testPod:       p500,
+			expectError:   false,
+		},
+		{
+			name:          "default - empty - insufficient cpu",
+			node:          n1000,
+			scheduledPods: []*apiv1.Pod{},
+			testPod:       p8000,
+			expectError:   true,
+		},
+		{
+			name:          "default - empty - ok",
+			node:          n1000,
+			scheduledPods: []*apiv1.Pod{},
+			testPod:       p600,
+			expectError:   false,
+		},
+		// custom predicate checker test cases; every subtest name is unique so failures are attributable
+		{
+			name:          "custom - other pod, over capacity - ok",
+			node:          n1000,
+			scheduledPods: []*apiv1.Pod{p450},
+			testPod:       p600,
+			expectError:   false,
+			customConfig:  customConfig,
+		},
+		{
+			name:          "custom - other pod, within capacity - ok",
+			node:          n1000,
+			scheduledPods: []*apiv1.Pod{p450},
+			testPod:       p500,
+			expectError:   false,
+			customConfig:  customConfig,
+		},
+		{
+			name:          "custom - empty, oversized pod - ok",
+			node:          n1000,
+			scheduledPods: []*apiv1.Pod{},
+			testPod:       p8000,
+			expectError:   false,
+			customConfig:  customConfig,
+		},
+		{
+			name:          "custom - empty, small pod - ok",
+			node:          n1000,
+			scheduledPods: []*apiv1.Pod{},
+			testPod:       p600,
+			expectError:   false,
+			customConfig:  customConfig,
+		},
+	}
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			// Setup failures abort the subtest instead of running on with nil values.
+			pluginRunner, snapshot, err := newTestPluginRunnerAndSnapshot(tt.customConfig)
+			if err != nil {
+				t.Fatal(err)
+			}
+			if err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(tt.node, tt.scheduledPods...)); err != nil {
+				t.Fatal(err)
+			}
+
+			node, state, predicateError := pluginRunner.RunFiltersOnNode(tt.testPod, tt.node.Name)
+			if !tt.expectError {
+				assert.Nil(t, predicateError)
+				assert.NotNil(t, state)
+				assert.Equal(t, tt.node, node)
+				return
+			}
+
+			assert.Nil(t, node)
+			assert.Nil(t, state)
+			// The assertions below call methods on the error, so a nil error must stop the subtest here.
+			if predicateError == nil {
+				t.Fatal("expected a failing predicate error, got nil")
+			}
+			assert.Equal(t, clustersnapshot.FailingPredicateError, predicateError.Type())
+			assert.Equal(t, "NodeResourcesFit", predicateError.FailingPredicateName())
+			assert.Equal(t, []string{"Insufficient cpu"}, predicateError.FailingPredicateReasons())
+			assert.Contains(t, predicateError.Error(), "NodeResourcesFit")
+			assert.Contains(t, predicateError.Error(), "Insufficient cpu")
+		})
+	}
+}
+
+// TestRunFilterUntilPassingNode checks which of two nodes RunFiltersUntilPassingNode picks for pods of
+// different sizes, with the default scheduler config and with the NodeResourcesFit-disabled custom config.
+func TestRunFilterUntilPassingNode(t *testing.T) {
+	p900 := BuildTestPod("p900", 900, 1000)
+	p1900 := BuildTestPod("p1900", 1900, 1000)
+	p2100 := BuildTestPod("p2100", 2100, 1000)
+
+	n1000 := BuildTestNode("n1000", 1000, 2000000)
+	n2000 := BuildTestNode("n2000", 2000, 2000000)
+
+	customConfig := loadTestSchedulerConfig(t, []byte(testconfig.SchedulerConfigNodeResourcesFitDisabled))
+
+	testCases := []struct {
+		name          string
+		customConfig  *config.KubeSchedulerConfiguration
+		pod           *apiv1.Pod
+		expectedNodes []string
+		expectError   bool
+	}{
+		// default predicate checker test cases
+		{
+			name:          "default - small pod - no error",
+			pod:           p900,
+			expectedNodes: []string{"n1000", "n2000"},
+			expectError:   false,
+		},
+		{
+			name:          "default - medium pod - no error",
+			pod:           p1900,
+			expectedNodes: []string{"n2000"},
+			expectError:   false,
+		},
+		{
+			name:        "default - large pod - insufficient cpu",
+			pod:         p2100,
+			expectError: true,
+		},
+
+		// custom predicate checker test cases
+		{
+			name:          "custom - small pod - no error",
+			customConfig:  customConfig,
+			pod:           p900,
+			expectedNodes: []string{"n1000", "n2000"},
+			expectError:   false,
+		},
+		{
+			name:          "custom - medium pod - no error",
+			customConfig:  customConfig,
+			pod:           p1900,
+			expectedNodes: []string{"n1000", "n2000"},
+			expectError:   false,
+		},
+		{
+			// This case expects success, so the name says so.
+			name:          "custom - large pod - no error",
+			customConfig:  customConfig,
+			pod:           p2100,
+			expectedNodes: []string{"n1000", "n2000"},
+			expectError:   false,
+		},
+	}
+
+	for _, tc := range testCases {
+		t.Run(tc.name, func(t *testing.T) {
+			pluginRunner, snapshot, err := newTestPluginRunnerAndSnapshot(tc.customConfig)
+			if err != nil {
+				t.Fatal(err)
+			}
+			for _, n := range []*apiv1.Node{n1000, n2000} {
+				if err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(n)); err != nil {
+					t.Fatal(err)
+				}
+			}
+
+			node, state, err := pluginRunner.RunFiltersUntilPassingNode(tc.pod, func(info *framework.NodeInfo) bool { return true })
+			if tc.expectError {
+				assert.Nil(t, node)
+				assert.Nil(t, state)
+				assert.Error(t, err)
+				return
+			}
+			assert.NoError(t, err)
+			assert.NotNil(t, state)
+			// Only read node.Name when a node was actually returned.
+			if assert.NotNil(t, node) {
+				assert.Contains(t, tc.expectedNodes, node.Name)
+			}
+		})
+	}
+}
+
+// TestDebugInfo checks that a TaintToleration failure reports the untolerated taint and includes the
+// node's taints in the error text, and that the same pod passes once a custom config built from
+// testconfig.SchedulerConfigTaintTolerationDisabled is used.
+func TestDebugInfo(t *testing.T) {
+	p1 := BuildTestPod("p1", 0, 0)
+	node1 := BuildTestNode("n1", 1000, 2000000)
+	node1.Spec.Taints = []apiv1.Taint{
+		{
+			Key:    "SomeTaint",
+			Value:  "WhyNot?",
+			Effect: apiv1.TaintEffectNoSchedule,
+		},
+		{
+			Key:    "RandomTaint",
+			Value:  "JustBecause",
+			Effect: apiv1.TaintEffectNoExecute,
+		},
+	}
+	SetNodeReadyState(node1, true, time.Time{})
+
+	// with default predicate checker
+	defaultPluginRunner, clusterSnapshot, err := newTestPluginRunnerAndSnapshot(nil)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if err := clusterSnapshot.AddNodeInfo(framework.NewTestNodeInfo(node1)); err != nil {
+		t.Fatal(err)
+	}
+
+	_, _, predicateErr := defaultPluginRunner.RunFiltersOnNode(p1, "n1")
+	// The assertions below call methods on the error, so a nil error must stop the test here.
+	if predicateErr == nil {
+		t.Fatal("expected a failing predicate error, got nil")
+	}
+	assert.Contains(t, predicateErr.FailingPredicateReasons(), "node(s) had untolerated taint {SomeTaint: WhyNot?}")
+	assert.Contains(t, predicateErr.Error(), "node(s) had untolerated taint {SomeTaint: WhyNot?}")
+	assert.Contains(t, predicateErr.Error(), "RandomTaint")
+
+	// with custom predicate checker
+	customConfig := loadTestSchedulerConfig(t, []byte(testconfig.SchedulerConfigTaintTolerationDisabled))
+	customPluginRunner, clusterSnapshot, err := newTestPluginRunnerAndSnapshot(customConfig)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if err := clusterSnapshot.AddNodeInfo(framework.NewTestNodeInfo(node1)); err != nil {
+		t.Fatal(err)
+	}
+
+	_, _, predicateErr = customPluginRunner.RunFiltersOnNode(p1, "n1")
+	assert.Nil(t, predicateErr)
+}
+
+// newTestPluginRunnerAndSnapshot builds a SchedulerPluginRunner together with the PredicateSnapshot it
+// reads from. A nil schedConfig selects the scheduler's default configuration.
+func newTestPluginRunnerAndSnapshot(schedConfig *config.KubeSchedulerConfiguration) (*SchedulerPluginRunner, clustersnapshot.ClusterSnapshot, error) {
+	if schedConfig == nil {
+		defaultConfig, err := scheduler_config_latest.Default()
+		if err != nil {
+			return nil, nil, err
+		}
+		schedConfig = defaultConfig
+	}
+
+	fwHandle, err := framework.NewHandle(informers.NewSharedInformerFactory(clientsetfake.NewSimpleClientset(), 0), schedConfig, true)
+	if err != nil {
+		return nil, nil, err
+	}
+	snapshot := NewPredicateSnapshot(base.NewBasicSnapshotBase(), fwHandle, false)
+	return NewSchedulerPluginRunner(fwHandle, snapshot), snapshot, nil
+}
diff --git a/cluster-autoscaler/simulator/clustersnapshot/predicate/predicate_snapshot.go b/cluster-autoscaler/simulator/clustersnapshot/predicate/predicate_snapshot.go
new file mode 100644
index 000000000000..8e9c39c20074
--- /dev/null
+++ b/cluster-autoscaler/simulator/clustersnapshot/predicate/predicate_snapshot.go
@@ -0,0 +1,107 @@
+/*
+Copyright 2016 The Kubernetes Authors.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+
+package predicate
+
+import (
+	apiv1 "k8s.io/api/core/v1"
+	"k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot"
+	"k8s.io/autoscaler/cluster-autoscaler/simulator/framework"
+)
+
+// PredicateSnapshot implements ClusterSnapshot by embedding a SnapshotBase and running
+// scheduler predicates through a SchedulerPluginRunner.
+type PredicateSnapshot struct {
+	clustersnapshot.SnapshotBase
+	pluginRunner *SchedulerPluginRunner
+	draEnabled   bool
+}
+
+// NewPredicateSnapshot builds a PredicateSnapshot on top of the given SnapshotBase.
+func NewPredicateSnapshot(snapshotBase clustersnapshot.SnapshotBase, fwHandle *framework.Handle, draEnabled bool) *PredicateSnapshot {
+	result := new(PredicateSnapshot)
+	result.SnapshotBase = snapshotBase
+	result.draEnabled = draEnabled
+	// The plugin runner takes the snapshot itself as an argument, so it is wired in after allocation.
+	result.pluginRunner = NewSchedulerPluginRunner(fwHandle, result)
+	return result
+}
+
+// GetNodeInfo looks up the schedulerframework.NodeInfo for nodeName in the underlying SnapshotBase
+// and returns it wrapped in an internal NodeInfo.
+func (s *PredicateSnapshot) GetNodeInfo(nodeName string) (*framework.NodeInfo, error) {
+	schedInfo, lookupErr := s.SnapshotBase.NodeInfos().Get(nodeName)
+	if lookupErr != nil {
+		return nil, lookupErr
+	}
+	wrapped := framework.WrapSchedulerNodeInfo(schedInfo, nil, nil)
+	return wrapped, nil
+}
+
+// ListNodeInfos lists every schedulerframework.NodeInfo in the underlying SnapshotBase and returns
+// each one wrapped in an internal NodeInfo.
+func (s *PredicateSnapshot) ListNodeInfos() ([]*framework.NodeInfo, error) {
+	all, listErr := s.SnapshotBase.NodeInfos().List()
+	if listErr != nil {
+		return nil, listErr
+	}
+	var wrapped []*framework.NodeInfo
+	for i := range all {
+		wrapped = append(wrapped, framework.WrapSchedulerNodeInfo(all[i], nil, nil))
+	}
+	return wrapped, nil
+}
+
+// AddNodeInfo adds the provided internal NodeInfo to the snapshot.
+func (s *PredicateSnapshot) AddNodeInfo(nodeInfo *framework.NodeInfo) error {
+	schedInfo := nodeInfo.ToScheduler()
+	return s.SnapshotBase.AddSchedulerNodeInfo(schedInfo)
+}
+
+// RemoveNodeInfo removes the NodeInfo with the given nodeName from the underlying SnapshotBase.
+func (s *PredicateSnapshot) RemoveNodeInfo(nodeName string) error {
+	return s.SnapshotBase.RemoveSchedulerNodeInfo(nodeName)
+}
+
+// SchedulePod runs the scheduler filters for the pod on the given node and, if they pass,
+// force-adds the pod to that node in the snapshot.
+func (s *PredicateSnapshot) SchedulePod(pod *apiv1.Pod, nodeName string) clustersnapshot.SchedulingError {
+	_, _, schedErr := s.pluginRunner.RunFiltersOnNode(pod, nodeName)
+	if schedErr != nil {
+		return schedErr
+	}
+	addErr := s.ForceAddPod(pod, nodeName)
+	if addErr != nil {
+		// A failure to add the pod after the filters passed is reported as an internal error.
+		return clustersnapshot.NewSchedulingInternalError(pod, addErr.Error())
+	}
+	return nil
+}
+
+// SchedulePodOnAnyNodeMatching runs the scheduler filters until a node accepted by anyNodeMatching
+// passes them, force-adds the pod to that node in the snapshot, and returns the node's name.
+func (s *PredicateSnapshot) SchedulePodOnAnyNodeMatching(pod *apiv1.Pod, anyNodeMatching func(*framework.NodeInfo) bool) (string, clustersnapshot.SchedulingError) {
+	node, _, schedErr := s.pluginRunner.RunFiltersUntilPassingNode(pod, anyNodeMatching)
+	if schedErr != nil {
+		return "", schedErr
+	}
+	chosen := node.Name
+	if addErr := s.ForceAddPod(pod, chosen); addErr != nil {
+		return "", clustersnapshot.NewSchedulingInternalError(pod, addErr.Error())
+	}
+	return chosen, nil
+}
+
+// UnschedulePod force-removes the pod identified by namespace and podName from the given node inside the snapshot.
+func (s *PredicateSnapshot) UnschedulePod(namespace string, podName string, nodeName string) error {
+	return s.ForceRemovePod(namespace, podName, nodeName)
+}
+
+// CheckPredicates checks whether scheduler predicates pass for the given pod on the given node.
+func (s *PredicateSnapshot) CheckPredicates(pod *apiv1.Pod, nodeName string) clustersnapshot.SchedulingError { + _, _, err := s.pluginRunner.RunFiltersOnNode(pod, nodeName) + return err +} diff --git a/cluster-autoscaler/simulator/clustersnapshot/clustersnapshot_benchmark_test.go b/cluster-autoscaler/simulator/clustersnapshot/predicate/predicate_snapshot_benchmark_test.go similarity index 53% rename from cluster-autoscaler/simulator/clustersnapshot/clustersnapshot_benchmark_test.go rename to cluster-autoscaler/simulator/clustersnapshot/predicate/predicate_snapshot_benchmark_test.go index fb6468adad6f..7a2123e059d3 100644 --- a/cluster-autoscaler/simulator/clustersnapshot/clustersnapshot_benchmark_test.go +++ b/cluster-autoscaler/simulator/clustersnapshot/predicate/predicate_snapshot_benchmark_test.go @@ -14,73 +14,33 @@ See the License for the specific language governing permissions and limitations under the License. */ -package clustersnapshot +package predicate import ( "fmt" "testing" - "time" "github.com/stretchr/testify/assert" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" . 
"k8s.io/autoscaler/cluster-autoscaler/utils/test" - - apiv1 "k8s.io/api/core/v1" ) -func createTestNodesWithPrefix(prefix string, n int) []*apiv1.Node { - nodes := make([]*apiv1.Node, n, n) - for i := 0; i < n; i++ { - nodes[i] = BuildTestNode(fmt.Sprintf("%s-%d", prefix, i), 2000, 2000000) - SetNodeReadyState(nodes[i], true, time.Time{}) - } - return nodes -} - -func createTestNodes(n int) []*apiv1.Node { - return createTestNodesWithPrefix("n", n) -} - -func createTestPodsWithPrefix(prefix string, n int) []*apiv1.Pod { - pods := make([]*apiv1.Pod, n, n) - for i := 0; i < n; i++ { - pods[i] = BuildTestPod(fmt.Sprintf("%s-%d", prefix, i), 1000, 2000000) - } - return pods -} - -func createTestPods(n int) []*apiv1.Pod { - return createTestPodsWithPrefix("p", n) -} - -func assignPodsToNodes(pods []*apiv1.Pod, nodes []*apiv1.Node) { - if len(nodes) == 0 { - return - } - - j := 0 - for i := 0; i < len(pods); i++ { - if j >= len(nodes) { - j = 0 - } - pods[i].Spec.NodeName = nodes[j].Name - j++ - } -} - func BenchmarkAddNodeInfo(b *testing.B) { testCases := []int{1, 10, 100, 1000, 5000, 15000, 100000} for snapshotName, snapshotFactory := range snapshots { for _, tc := range testCases { - nodes := createTestNodes(tc) - clusterSnapshot := snapshotFactory() + nodes := clustersnapshot.CreateTestNodes(tc) + clusterSnapshot, err := snapshotFactory() + assert.NoError(b, err) b.ResetTimer() b.Run(fmt.Sprintf("%s: AddNodeInfo() %d", snapshotName, tc), func(b *testing.B) { for i := 0; i < b.N; i++ { b.StopTimer() - assert.NoError(b, clusterSnapshot.SetClusterState(nil, nil)) + assert.NoError(b, clusterSnapshot.SetClusterState(nil, nil, drasnapshot.Snapshot{})) b.StartTimer() for _, node := range nodes { err := clusterSnapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) @@ -99,9 +59,10 @@ func BenchmarkListNodeInfos(b *testing.B) { for snapshotName, snapshotFactory := range snapshots { for _, tc := range testCases { - nodes := createTestNodes(tc) - clusterSnapshot := 
snapshotFactory() - err := clusterSnapshot.SetClusterState(nodes, nil) + nodes := clustersnapshot.CreateTestNodes(tc) + clusterSnapshot, err := snapshotFactory() + assert.NoError(b, err) + err = clusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) if err != nil { assert.NoError(b, err) } @@ -126,18 +87,19 @@ func BenchmarkAddPods(b *testing.B) { for snapshotName, snapshotFactory := range snapshots { for _, tc := range testCases { - nodes := createTestNodes(tc) - pods := createTestPods(tc * 30) - assignPodsToNodes(pods, nodes) - clusterSnapshot := snapshotFactory() - err := clusterSnapshot.SetClusterState(nodes, nil) + nodes := clustersnapshot.CreateTestNodes(tc) + pods := clustersnapshot.CreateTestPods(tc * 30) + clustersnapshot.AssignTestPodsToNodes(pods, nodes) + clusterSnapshot, err := snapshotFactory() + assert.NoError(b, err) + err = clusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) assert.NoError(b, err) b.ResetTimer() b.Run(fmt.Sprintf("%s: ForceAddPod() 30*%d", snapshotName, tc), func(b *testing.B) { for i := 0; i < b.N; i++ { b.StopTimer() - err = clusterSnapshot.SetClusterState(nodes, nil) + err = clusterSnapshot.SetClusterState(nodes, nil, drasnapshot.Snapshot{}) if err != nil { assert.NoError(b, err) } @@ -160,12 +122,13 @@ func BenchmarkForkAddRevert(b *testing.B) { for snapshotName, snapshotFactory := range snapshots { for _, ntc := range nodeTestCases { - nodes := createTestNodes(ntc) + nodes := clustersnapshot.CreateTestNodes(ntc) for _, ptc := range podTestCases { - pods := createTestPods(ntc * ptc) - assignPodsToNodes(pods, nodes) - clusterSnapshot := snapshotFactory() - err := clusterSnapshot.SetClusterState(nodes, pods) + pods := clustersnapshot.CreateTestPods(ntc * ptc) + clustersnapshot.AssignTestPodsToNodes(pods, nodes) + clusterSnapshot, err := snapshotFactory() + assert.NoError(b, err) + err = clusterSnapshot.SetClusterState(nodes, pods, drasnapshot.Snapshot{}) assert.NoError(b, err) tmpNode1 := 
BuildTestNode("tmp-1", 2000, 2000000) tmpNode2 := BuildTestNode("tmp-2", 2000, 2000000) @@ -190,61 +153,3 @@ func BenchmarkForkAddRevert(b *testing.B) { } } } - -func BenchmarkBuildNodeInfoList(b *testing.B) { - testCases := []struct { - nodeCount int - }{ - { - nodeCount: 1000, - }, - { - nodeCount: 5000, - }, - { - nodeCount: 15000, - }, - { - nodeCount: 100000, - }, - } - - for _, tc := range testCases { - b.Run(fmt.Sprintf("fork add 1000 to %d", tc.nodeCount), func(b *testing.B) { - nodes := createTestNodes(tc.nodeCount + 1000) - snapshot := NewDeltaClusterSnapshot() - if err := snapshot.SetClusterState(nodes[:tc.nodeCount], nil); err != nil { - assert.NoError(b, err) - } - snapshot.Fork() - for _, node := range nodes[tc.nodeCount:] { - if err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)); err != nil { - assert.NoError(b, err) - } - } - b.ResetTimer() - for i := 0; i < b.N; i++ { - list := snapshot.data.buildNodeInfoList() - if len(list) != tc.nodeCount+1000 { - assert.Equal(b, len(list), tc.nodeCount+1000) - } - } - }) - } - for _, tc := range testCases { - b.Run(fmt.Sprintf("base %d", tc.nodeCount), func(b *testing.B) { - nodes := createTestNodes(tc.nodeCount) - snapshot := NewDeltaClusterSnapshot() - if err := snapshot.SetClusterState(nodes, nil); err != nil { - assert.NoError(b, err) - } - b.ResetTimer() - for i := 0; i < b.N; i++ { - list := snapshot.data.buildNodeInfoList() - if len(list) != tc.nodeCount { - assert.Equal(b, len(list), tc.nodeCount) - } - } - }) - } -} diff --git a/cluster-autoscaler/simulator/clustersnapshot/clustersnapshot_test.go b/cluster-autoscaler/simulator/clustersnapshot/predicate/predicate_snapshot_test.go similarity index 81% rename from cluster-autoscaler/simulator/clustersnapshot/clustersnapshot_test.go rename to cluster-autoscaler/simulator/clustersnapshot/predicate/predicate_snapshot_test.go index 4eeb67253558..c490c9cd3aa2 100644 --- a/cluster-autoscaler/simulator/clustersnapshot/clustersnapshot_test.go +++ 
b/cluster-autoscaler/simulator/clustersnapshot/predicate/predicate_snapshot_test.go @@ -14,7 +14,7 @@ See the License for the specific language governing permissions and limitations under the License. */ -package clustersnapshot +package predicate import ( "fmt" @@ -23,6 +23,9 @@ import ( "time" apiv1 "k8s.io/api/core/v1" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/base" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" . "k8s.io/autoscaler/cluster-autoscaler/utils/test" schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" @@ -30,9 +33,21 @@ import ( "github.com/stretchr/testify/assert" ) -var snapshots = map[string]func() ClusterSnapshot{ - "basic": func() ClusterSnapshot { return NewBasicClusterSnapshot() }, - "delta": func() ClusterSnapshot { return NewDeltaClusterSnapshot() }, +var snapshots = map[string]func() (clustersnapshot.ClusterSnapshot, error){ + "basic": func() (clustersnapshot.ClusterSnapshot, error) { + fwHandle, err := framework.NewTestFrameworkHandle() + if err != nil { + return nil, err + } + return NewPredicateSnapshot(base.NewBasicSnapshotBase(), fwHandle, false), nil + }, + "delta": func() (clustersnapshot.ClusterSnapshot, error) { + fwHandle, err := framework.NewTestFrameworkHandle() + if err != nil { + return nil, err + } + return NewPredicateSnapshot(base.NewDeltaSnapshotBase(), fwHandle, false), nil + }, } func nodeNames(nodes []*apiv1.Node) []string { @@ -61,7 +76,7 @@ func compareStates(t *testing.T, a, b snapshotState) { assert.ElementsMatch(t, a.pods, b.pods) } -func getSnapshotState(t *testing.T, snapshot ClusterSnapshot) snapshotState { +func getSnapshotState(t *testing.T, snapshot clustersnapshot.ClusterSnapshot) snapshotState { nodes, err := snapshot.ListNodeInfos() assert.NoError(t, err) var pods []*apiv1.Pod @@ -73,16 +88,17 @@ func 
getSnapshotState(t *testing.T, snapshot ClusterSnapshot) snapshotState { return snapshotState{extractNodes(nodes), pods} } -func startSnapshot(t *testing.T, snapshotFactory func() ClusterSnapshot, state snapshotState) ClusterSnapshot { - snapshot := snapshotFactory() - err := snapshot.SetClusterState(state.nodes, state.pods) +func startSnapshot(t *testing.T, snapshotFactory func() (clustersnapshot.ClusterSnapshot, error), state snapshotState) clustersnapshot.ClusterSnapshot { + snapshot, err := snapshotFactory() + assert.NoError(t, err) + err = snapshot.SetClusterState(state.nodes, state.pods, drasnapshot.Snapshot{}) assert.NoError(t, err) return snapshot } type modificationTestCase struct { name string - op func(ClusterSnapshot) + op func(clustersnapshot.ClusterSnapshot) state snapshotState modifiedState snapshotState } @@ -95,7 +111,7 @@ func validTestCases(t *testing.T) []modificationTestCase { testCases := []modificationTestCase{ { name: "add empty nodeInfo", - op: func(snapshot ClusterSnapshot) { + op: func(snapshot clustersnapshot.ClusterSnapshot) { err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) assert.NoError(t, err) }, @@ -105,7 +121,7 @@ func validTestCases(t *testing.T) []modificationTestCase { }, { name: "add nodeInfo", - op: func(snapshot ClusterSnapshot) { + op: func(snapshot clustersnapshot.ClusterSnapshot) { err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node, pod)) assert.NoError(t, err) }, @@ -119,7 +135,7 @@ func validTestCases(t *testing.T) []modificationTestCase { state: snapshotState{ nodes: []*apiv1.Node{node}, }, - op: func(snapshot ClusterSnapshot) { + op: func(snapshot clustersnapshot.ClusterSnapshot) { err := snapshot.RemoveNodeInfo(node.Name) assert.NoError(t, err) }, @@ -129,7 +145,7 @@ func validTestCases(t *testing.T) []modificationTestCase { state: snapshotState{ nodes: []*apiv1.Node{node}, }, - op: func(snapshot ClusterSnapshot) { + op: func(snapshot clustersnapshot.ClusterSnapshot) { err := 
snapshot.RemoveNodeInfo(node.Name) assert.NoError(t, err) @@ -145,10 +161,10 @@ func validTestCases(t *testing.T) []modificationTestCase { state: snapshotState{ nodes: []*apiv1.Node{node}, }, - op: func(snapshot ClusterSnapshot) { - err := snapshot.ForceAddPod(pod, node.Name) - assert.NoError(t, err) - err = snapshot.RemoveNodeInfo(node.Name) + op: func(snapshot clustersnapshot.ClusterSnapshot) { + schedErr := snapshot.ForceAddPod(pod, node.Name) + assert.NoError(t, schedErr) + err := snapshot.RemoveNodeInfo(node.Name) assert.NoError(t, err) }, }, @@ -284,20 +300,20 @@ func TestSetClusterState(t *testing.T) { extraNodeCount := localRand.Intn(100) extraPodCount := localRand.Intn(1000) - nodes := createTestNodes(nodeCount) - pods := createTestPods(podCount) - assignPodsToNodes(pods, nodes) + nodes := clustersnapshot.CreateTestNodes(nodeCount) + pods := clustersnapshot.CreateTestPods(podCount) + clustersnapshot.AssignTestPodsToNodes(pods, nodes) state := snapshotState{nodes, pods} - extraNodes := createTestNodesWithPrefix("extra", extraNodeCount) + extraNodes := clustersnapshot.CreateTestNodesWithPrefix("extra", extraNodeCount) allNodes := make([]*apiv1.Node, len(nodes)+len(extraNodes), len(nodes)+len(extraNodes)) copy(allNodes, nodes) copy(allNodes[len(nodes):], extraNodes) - extraPods := createTestPodsWithPrefix("extra", extraPodCount) - assignPodsToNodes(extraPods, allNodes) + extraPods := clustersnapshot.CreateTestPodsWithPrefix("extra", extraPodCount) + clustersnapshot.AssignTestPodsToNodes(extraPods, allNodes) allPods := make([]*apiv1.Pod, len(pods)+len(extraPods), len(pods)+len(extraPods)) copy(allPods, pods) @@ -309,7 +325,7 @@ func TestSetClusterState(t *testing.T) { snapshot := startSnapshot(t, snapshotFactory, state) compareStates(t, state, getSnapshotState(t, snapshot)) - assert.NoError(t, snapshot.SetClusterState(nil, nil)) + assert.NoError(t, snapshot.SetClusterState(nil, nil, drasnapshot.Snapshot{})) compareStates(t, snapshotState{}, getSnapshotState(t, 
snapshot)) }) @@ -318,9 +334,9 @@ func TestSetClusterState(t *testing.T) { snapshot := startSnapshot(t, snapshotFactory, state) compareStates(t, state, getSnapshotState(t, snapshot)) - newNodes, newPods := createTestNodes(13), createTestPods(37) - assignPodsToNodes(newPods, newNodes) - assert.NoError(t, snapshot.SetClusterState(newNodes, newPods)) + newNodes, newPods := clustersnapshot.CreateTestNodes(13), clustersnapshot.CreateTestPods(37) + clustersnapshot.AssignTestPodsToNodes(newPods, newNodes) + assert.NoError(t, snapshot.SetClusterState(newNodes, newPods, drasnapshot.Snapshot{})) compareStates(t, snapshotState{nodes: newNodes, pods: newPods}, getSnapshotState(t, snapshot)) }) @@ -343,7 +359,7 @@ func TestSetClusterState(t *testing.T) { compareStates(t, snapshotState{allNodes, allPods}, getSnapshotState(t, snapshot)) - assert.NoError(t, snapshot.SetClusterState(nil, nil)) + assert.NoError(t, snapshot.SetClusterState(nil, nil, drasnapshot.Snapshot{})) compareStates(t, snapshotState{}, getSnapshotState(t, snapshot)) @@ -357,19 +373,19 @@ func TestNode404(t *testing.T) { // Anything and everything that returns errNodeNotFound should be tested here. 
ops := []struct { name string - op func(ClusterSnapshot) error + op func(clustersnapshot.ClusterSnapshot) error }{ - {"add pod", func(snapshot ClusterSnapshot) error { + {"add pod", func(snapshot clustersnapshot.ClusterSnapshot) error { return snapshot.ForceAddPod(BuildTestPod("p1", 0, 0), "node") }}, - {"remove pod", func(snapshot ClusterSnapshot) error { + {"remove pod", func(snapshot clustersnapshot.ClusterSnapshot) error { return snapshot.ForceRemovePod("default", "p1", "node") }}, - {"get node", func(snapshot ClusterSnapshot) error { + {"get node", func(snapshot clustersnapshot.ClusterSnapshot) error { _, err := snapshot.NodeInfos().Get("node") return err }}, - {"remove nodeInfo", func(snapshot ClusterSnapshot) error { + {"remove nodeInfo", func(snapshot clustersnapshot.ClusterSnapshot) error { return snapshot.RemoveNodeInfo("node") }}, } @@ -378,19 +394,21 @@ func TestNode404(t *testing.T) { for _, op := range ops { t.Run(fmt.Sprintf("%s: %s empty", name, op.name), func(t *testing.T) { - snapshot := snapshotFactory() + snapshot, err := snapshotFactory() + assert.NoError(t, err) // Empty snapshot - shouldn't be able to operate on nodes that are not here. 
- err := op.op(snapshot) + err = op.op(snapshot) assert.Error(t, err) }) t.Run(fmt.Sprintf("%s: %s fork", name, op.name), func(t *testing.T) { - snapshot := snapshotFactory() + snapshot, err := snapshotFactory() + assert.NoError(t, err) node := BuildTestNode("node", 10, 100) - err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) + err = snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) assert.NoError(t, err) snapshot.Fork() @@ -413,10 +431,11 @@ func TestNode404(t *testing.T) { t.Run(fmt.Sprintf("%s: %s base", name, op.name), func(t *testing.T) { - snapshot := snapshotFactory() + snapshot, err := snapshotFactory() + assert.NoError(t, err) node := BuildTestNode("node", 10, 100) - err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) + err = snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) assert.NoError(t, err) err = snapshot.RemoveNodeInfo("node") @@ -437,9 +456,9 @@ func TestNodeAlreadyExists(t *testing.T) { ops := []struct { name string - op func(ClusterSnapshot) error + op func(clustersnapshot.ClusterSnapshot) error }{ - {"add nodeInfo", func(snapshot ClusterSnapshot) error { + {"add nodeInfo", func(snapshot clustersnapshot.ClusterSnapshot) error { return snapshot.AddNodeInfo(framework.NewTestNodeInfo(node, pod)) }}, } @@ -448,9 +467,10 @@ func TestNodeAlreadyExists(t *testing.T) { for _, op := range ops { t.Run(fmt.Sprintf("%s: %s base", name, op.name), func(t *testing.T) { - snapshot := snapshotFactory() + snapshot, err := snapshotFactory() + assert.NoError(t, err) - err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) + err = snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) assert.NoError(t, err) // Node already in base. 
@@ -460,9 +480,10 @@ func TestNodeAlreadyExists(t *testing.T) { t.Run(fmt.Sprintf("%s: %s base, forked", name, op.name), func(t *testing.T) { - snapshot := snapshotFactory() + snapshot, err := snapshotFactory() + assert.NoError(t, err) - err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) + err = snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) assert.NoError(t, err) snapshot.Fork() @@ -475,11 +496,12 @@ func TestNodeAlreadyExists(t *testing.T) { t.Run(fmt.Sprintf("%s: %s fork", name, op.name), func(t *testing.T) { - snapshot := snapshotFactory() + snapshot, err := snapshotFactory() + assert.NoError(t, err) snapshot.Fork() - err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) + err = snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) assert.NoError(t, err) // Node already in fork. @@ -488,11 +510,12 @@ func TestNodeAlreadyExists(t *testing.T) { }) t.Run(fmt.Sprintf("%s: %s committed", name, op.name), func(t *testing.T) { - snapshot := snapshotFactory() + snapshot, err := snapshotFactory() + assert.NoError(t, err) snapshot.Fork() - err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) + err = snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) assert.NoError(t, err) err = snapshot.Commit() @@ -628,8 +651,9 @@ func TestPVCUsedByPods(t *testing.T) { for snapshotName, snapshotFactory := range snapshots { for _, tc := range testcase { t.Run(fmt.Sprintf("%s with snapshot (%s)", tc.desc, snapshotName), func(t *testing.T) { - snapshot := snapshotFactory() - err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(tc.node, tc.pods...)) + snapshot, err := snapshotFactory() + assert.NoError(t, err) + err = snapshot.AddNodeInfo(framework.NewTestNodeInfo(tc.node, tc.pods...)) assert.NoError(t, err) volumeExists := snapshot.StorageInfos().IsPVCUsedByPods(schedulerframework.GetNamespacedName("default", tc.claimName)) @@ -698,8 +722,9 @@ func TestPVCClearAndFork(t *testing.T) { for snapshotName, snapshotFactory := range snapshots { 
t.Run(fmt.Sprintf("fork and revert snapshot with pvc pods with snapshot: %s", snapshotName), func(t *testing.T) { - snapshot := snapshotFactory() - err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node, pod1)) + snapshot, err := snapshotFactory() + assert.NoError(t, err) + err = snapshot.AddNodeInfo(framework.NewTestNodeInfo(node, pod1)) assert.NoError(t, err) volumeExists := snapshot.StorageInfos().IsPVCUsedByPods(schedulerframework.GetNamespacedName("default", "claim1")) assert.Equal(t, true, volumeExists) @@ -723,13 +748,14 @@ func TestPVCClearAndFork(t *testing.T) { }) t.Run(fmt.Sprintf("clear snapshot with pvc pods with snapshot: %s", snapshotName), func(t *testing.T) { - snapshot := snapshotFactory() - err := snapshot.AddNodeInfo(framework.NewTestNodeInfo(node, pod1)) + snapshot, err := snapshotFactory() + assert.NoError(t, err) + err = snapshot.AddNodeInfo(framework.NewTestNodeInfo(node, pod1)) assert.NoError(t, err) volumeExists := snapshot.StorageInfos().IsPVCUsedByPods(schedulerframework.GetNamespacedName("default", "claim1")) assert.Equal(t, true, volumeExists) - assert.NoError(t, snapshot.SetClusterState(nil, nil)) + assert.NoError(t, snapshot.SetClusterState(nil, nil, drasnapshot.Snapshot{})) volumeExists = snapshot.StorageInfos().IsPVCUsedByPods(schedulerframework.GetNamespacedName("default", "claim1")) assert.Equal(t, false, volumeExists) @@ -752,7 +778,7 @@ func TestWithForkedSnapshot(t *testing.T) { return false, err } t.Run(fmt.Sprintf("%s: %s WithForkedSnapshot for failed function", name, tc.name), func(t *testing.T) { - err1, err2 := WithForkedSnapshot(snapshot, failedFunc) + err1, err2 := clustersnapshot.WithForkedSnapshot(snapshot, failedFunc) assert.Error(t, err1) assert.NoError(t, err2) @@ -760,7 +786,7 @@ func TestWithForkedSnapshot(t *testing.T) { compareStates(t, tc.state, getSnapshotState(t, snapshot)) }) t.Run(fmt.Sprintf("%s: %s WithForkedSnapshot for success function", name, tc.name), func(t *testing.T) { - err1, err2 := 
WithForkedSnapshot(snapshot, successFunc) + err1, err2 := clustersnapshot.WithForkedSnapshot(snapshot, successFunc) assert.Error(t, err1) assert.NoError(t, err2) diff --git a/cluster-autoscaler/simulator/clustersnapshot/test_utils.go b/cluster-autoscaler/simulator/clustersnapshot/test_utils.go index f0cd8c67546e..3587b64639d9 100644 --- a/cluster-autoscaler/simulator/clustersnapshot/test_utils.go +++ b/cluster-autoscaler/simulator/clustersnapshot/test_utils.go @@ -17,12 +17,17 @@ limitations under the License. package clustersnapshot import ( + "fmt" + "math" "testing" + "time" "github.com/stretchr/testify/assert" apiv1 "k8s.io/api/core/v1" + drasnapshot "k8s.io/autoscaler/cluster-autoscaler/simulator/dynamicresources/snapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" + "k8s.io/autoscaler/cluster-autoscaler/utils/test" ) // InitializeClusterSnapshotOrDie clears cluster snapshot and then initializes it with given set of nodes and pods. @@ -34,7 +39,7 @@ func InitializeClusterSnapshotOrDie( pods []*apiv1.Pod) { var err error - assert.NoError(t, snapshot.SetClusterState(nil, nil)) + assert.NoError(t, snapshot.SetClusterState(nil, nil, drasnapshot.Snapshot{})) for _, node := range nodes { err = snapshot.AddNodeInfo(framework.NewTestNodeInfo(node)) @@ -53,3 +58,48 @@ func InitializeClusterSnapshotOrDie( } } } + +// CreateTestNodesWithPrefix creates n test Nodes with the given name prefix. +func CreateTestNodesWithPrefix(prefix string, n int) []*apiv1.Node { + nodes := make([]*apiv1.Node, n, n) + for i := 0; i < n; i++ { + nodes[i] = test.BuildTestNode(fmt.Sprintf("%s-%d", prefix, i), math.MaxInt, math.MaxInt) + test.SetNodeReadyState(nodes[i], true, time.Time{}) + } + return nodes +} + +// CreateTestNodes creates n test Nodes. +func CreateTestNodes(n int) []*apiv1.Node { + return CreateTestNodesWithPrefix("n", n) +} + +// CreateTestPodsWithPrefix creates n test Pods with the given name prefix. 
+func CreateTestPodsWithPrefix(prefix string, n int) []*apiv1.Pod { + pods := make([]*apiv1.Pod, n, n) + for i := 0; i < n; i++ { + pods[i] = test.BuildTestPod(fmt.Sprintf("%s-%d", prefix, i), 1, 1) + } + return pods +} + +// CreateTestPods creates n test Pods. +func CreateTestPods(n int) []*apiv1.Pod { + return CreateTestPodsWithPrefix("p", n) +} + +// AssignTestPodsToNodes assigns test pods to test nodes based on their index position. +func AssignTestPodsToNodes(pods []*apiv1.Pod, nodes []*apiv1.Node) { + if len(nodes) == 0 { + return + } + + j := 0 + for i := 0; i < len(pods); i++ { + if j >= len(nodes) { + j = 0 + } + pods[i].Spec.NodeName = nodes[j].Name + j++ + } +} diff --git a/cluster-autoscaler/simulator/clustersnapshot/testsnapshot/test_snapshot.go b/cluster-autoscaler/simulator/clustersnapshot/testsnapshot/test_snapshot.go new file mode 100644 index 000000000000..dcbd93b4928e --- /dev/null +++ b/cluster-autoscaler/simulator/clustersnapshot/testsnapshot/test_snapshot.go @@ -0,0 +1,65 @@ +/* +Copyright 2024 The Kubernetes Authors. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +*/ + +package testsnapshot + +import ( + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/base" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/predicate" + "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" +) + +// testFailer is an abstraction that covers both *testing.T and *testing.B. 
+type testFailer interface { + Fatalf(format string, args ...any) +} + +// NewTestSnapshot returns an instance of ClusterSnapshot that can be used in tests. +func NewTestSnapshot() (clustersnapshot.ClusterSnapshot, error) { + testFwHandle, err := framework.NewTestFrameworkHandle() + if err != nil { + return nil, err + } + return predicate.NewPredicateSnapshot(base.NewBasicSnapshotBase(), testFwHandle, true), nil +} + +// NewTestSnapshotOrDie returns an instance of ClusterSnapshot that can be used in tests. +func NewTestSnapshotOrDie(t testFailer) clustersnapshot.ClusterSnapshot { + snapshot, err := NewTestSnapshot() + if err != nil { + t.Fatalf("NewTestSnapshotOrDie: couldn't create test ClusterSnapshot: %v", err) + } + return snapshot +} + +// NewCustomTestSnapshot returns an instance of ClusterSnapshot with a specific SnapshotBase that can be used in tests. +func NewCustomTestSnapshot(snapshot clustersnapshot.SnapshotBase) (clustersnapshot.ClusterSnapshot, error) { + testFwHandle, err := framework.NewTestFrameworkHandle() + if err != nil { + return nil, err + } + return predicate.NewPredicateSnapshot(snapshot, testFwHandle, true), nil +} + +// NewCustomTestSnapshotOrDie returns an instance of ClusterSnapshot with a specific SnapshotBase that can be used in tests. +func NewCustomTestSnapshotOrDie(t testFailer, snapshot clustersnapshot.SnapshotBase) clustersnapshot.ClusterSnapshot { + result, err := NewCustomTestSnapshot(snapshot) + if err != nil { + t.Fatalf("NewCustomTestSnapshotOrDie: couldn't create test ClusterSnapshot: %v", err) + } + return result +} diff --git a/cluster-autoscaler/simulator/dynamicresources/snapshot/snapshot.go b/cluster-autoscaler/simulator/dynamicresources/snapshot/snapshot.go new file mode 100644 index 000000000000..587115cfb17c --- /dev/null +++ b/cluster-autoscaler/simulator/dynamicresources/snapshot/snapshot.go @@ -0,0 +1,48 @@ +/* +Copyright 2024 The Kubernetes Authors. 
+ +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +*/ + +package snapshot + +import ( + schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" +) + +// Snapshot contains a snapshot of all DRA objects taken at a ~single point in time. +type Snapshot struct { +} + +// ResourceClaims exposes the Snapshot as schedulerframework.ResourceClaimTracker, in order to interact with +// the scheduler framework. +func (s Snapshot) ResourceClaims() schedulerframework.ResourceClaimTracker { + return nil +} + +// ResourceSlices exposes the Snapshot as schedulerframework.ResourceSliceLister, in order to interact with +// the scheduler framework. +func (s Snapshot) ResourceSlices() schedulerframework.ResourceSliceLister { + return nil +} + +// DeviceClasses exposes the Snapshot as schedulerframework.DeviceClassLister, in order to interact with +// the scheduler framework. +func (s Snapshot) DeviceClasses() schedulerframework.DeviceClassLister { + return nil +} + +// Clone returns a copy of this Snapshot that can be independently modified without affecting this Snapshot. +func (s Snapshot) Clone() Snapshot { + return Snapshot{} +} diff --git a/cluster-autoscaler/simulator/framework/delegating_shared_lister.go b/cluster-autoscaler/simulator/framework/delegating_shared_lister.go new file mode 100644 index 000000000000..c57f873df6fa --- /dev/null +++ b/cluster-autoscaler/simulator/framework/delegating_shared_lister.go @@ -0,0 +1,182 @@ +/* +Copyright 2020 The Kubernetes Authors. 
+ +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +*/ + +package framework + +import ( + "fmt" + + resourceapi "k8s.io/api/resource/v1beta1" + "k8s.io/apimachinery/pkg/types" + "k8s.io/apimachinery/pkg/util/sets" + "k8s.io/dynamic-resource-allocation/structured" + "k8s.io/klog/v2" + schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" +) + +// SharedLister groups all interfaces that Cluster Autoscaler needs to implement for integrating with kube-scheduler. +type SharedLister interface { + schedulerframework.SharedLister + schedulerframework.SharedDRAManager +} + +// DelegatingSchedulerSharedLister implements schedulerframework interfaces by passing the logic to a delegate. Delegate can be updated. +type DelegatingSchedulerSharedLister struct { + delegate SharedLister +} + +// NewDelegatingSchedulerSharedLister creates a new DelegatingSchedulerSharedLister whose delegate is initially unset. +func NewDelegatingSchedulerSharedLister() *DelegatingSchedulerSharedLister { + return &DelegatingSchedulerSharedLister{ + delegate: unsetSharedListerSingleton, + } +} + +// NodeInfos returns a NodeInfoLister. +func (lister *DelegatingSchedulerSharedLister) NodeInfos() schedulerframework.NodeInfoLister { + return lister.delegate.NodeInfos() +} + +// StorageInfos returns a StorageInfoLister. +func (lister *DelegatingSchedulerSharedLister) StorageInfos() schedulerframework.StorageInfoLister { + return lister.delegate.StorageInfos() +} + +// ResourceClaims returns a ResourceClaimTracker. 
+func (lister *DelegatingSchedulerSharedLister) ResourceClaims() schedulerframework.ResourceClaimTracker { + return lister.delegate.ResourceClaims() +} + +// ResourceSlices returns a ResourceSliceLister. +func (lister *DelegatingSchedulerSharedLister) ResourceSlices() schedulerframework.ResourceSliceLister { + return lister.delegate.ResourceSlices() +} + +// DeviceClasses returns a DeviceClassLister. +func (lister *DelegatingSchedulerSharedLister) DeviceClasses() schedulerframework.DeviceClassLister { + return lister.delegate.DeviceClasses() +} + +// UpdateDelegate replaces the current delegate with the given one. +func (lister *DelegatingSchedulerSharedLister) UpdateDelegate(delegate SharedLister) { + lister.delegate = delegate +} + +// ResetDelegate resets the delegate to the unset placeholder lister. +func (lister *DelegatingSchedulerSharedLister) ResetDelegate() { + lister.delegate = unsetSharedListerSingleton +} + +type unsetSharedLister struct{} +type unsetNodeInfoLister unsetSharedLister +type unsetStorageInfoLister unsetSharedLister +type unsetResourceClaimTracker unsetSharedLister +type unsetResourceSliceLister unsetSharedLister +type unsetDeviceClassLister unsetSharedLister + +// List always returns an error. +func (lister *unsetNodeInfoLister) List() ([]*schedulerframework.NodeInfo, error) { + return nil, fmt.Errorf("lister not set in delegate") +} + +// HavePodsWithAffinityList always returns an error. +func (lister *unsetNodeInfoLister) HavePodsWithAffinityList() ([]*schedulerframework.NodeInfo, error) { + return nil, fmt.Errorf("lister not set in delegate") +} + +// HavePodsWithRequiredAntiAffinityList always returns an error. 
+func (lister *unsetNodeInfoLister) HavePodsWithRequiredAntiAffinityList() ([]*schedulerframework.NodeInfo, error) { + return nil, fmt.Errorf("lister not set in delegate") +} + +// Get always returns an error +func (lister *unsetNodeInfoLister) Get(nodeName string) (*schedulerframework.NodeInfo, error) { + return nil, fmt.Errorf("lister not set in delegate") +} + +func (lister *unsetStorageInfoLister) IsPVCUsedByPods(key string) bool { + return false +} + +func (u *unsetResourceClaimTracker) List() ([]*resourceapi.ResourceClaim, error) { + return nil, fmt.Errorf("lister not set in delegate") +} + +func (u *unsetResourceClaimTracker) Get(namespace, claimName string) (*resourceapi.ResourceClaim, error) { + return nil, fmt.Errorf("lister not set in delegate") +} + +func (u *unsetResourceClaimTracker) ListAllAllocatedDevices() (sets.Set[structured.DeviceID], error) { + return nil, fmt.Errorf("lister not set in delegate") +} + +func (u *unsetResourceClaimTracker) SignalClaimPendingAllocation(claimUID types.UID, allocatedClaim *resourceapi.ResourceClaim) error { + return fmt.Errorf("lister not set in delegate") +} + +func (u *unsetResourceClaimTracker) ClaimHasPendingAllocation(claimUID types.UID) bool { + klog.Errorf("lister not set in delegate") + return false +} + +func (u *unsetResourceClaimTracker) RemoveClaimPendingAllocation(claimUID types.UID) (deleted bool) { + klog.Errorf("lister not set in delegate") + return false +} + +func (u *unsetResourceClaimTracker) AssumeClaimAfterAPICall(claim *resourceapi.ResourceClaim) error { + return fmt.Errorf("lister not set in delegate") +} + +func (u *unsetResourceClaimTracker) AssumedClaimRestore(namespace, claimName string) { + klog.Errorf("lister not set in delegate") +} + +func (u *unsetResourceSliceLister) List() ([]*resourceapi.ResourceSlice, error) { + return nil, fmt.Errorf("lister not set in delegate") +} + +func (u *unsetDeviceClassLister) List() ([]*resourceapi.DeviceClass, error) { + return nil, fmt.Errorf("lister not set in 
delegate") +} + +func (u *unsetDeviceClassLister) Get(className string) (*resourceapi.DeviceClass, error) { + return nil, fmt.Errorf("lister not set in delegate") +} + +// NodeInfos returns a fake NodeInfoLister which always returns an error +func (lister *unsetSharedLister) NodeInfos() schedulerframework.NodeInfoLister { + return (*unsetNodeInfoLister)(lister) +} + +// StorageInfos returns a fake StorageInfoLister which always reports PVCs as unused +func (lister *unsetSharedLister) StorageInfos() schedulerframework.StorageInfoLister { + return (*unsetStorageInfoLister)(lister) +} + +func (lister *unsetSharedLister) ResourceClaims() schedulerframework.ResourceClaimTracker { + return (*unsetResourceClaimTracker)(lister) +} + +func (lister *unsetSharedLister) ResourceSlices() schedulerframework.ResourceSliceLister { + return (*unsetResourceSliceLister)(lister) +} + +func (lister *unsetSharedLister) DeviceClasses() schedulerframework.DeviceClassLister { + return (*unsetDeviceClassLister)(lister) +} + +var unsetSharedListerSingleton *unsetSharedLister diff --git a/cluster-autoscaler/simulator/framework/handle.go b/cluster-autoscaler/simulator/framework/handle.go new file mode 100644 index 000000000000..83a7516194f7 --- /dev/null +++ b/cluster-autoscaler/simulator/framework/handle.go @@ -0,0 +1,99 @@ +/* +Copyright 2024 The Kubernetes Authors. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. 
+*/ + +package framework + +import ( + "context" + "fmt" + + "k8s.io/client-go/informers" + "k8s.io/kubernetes/pkg/scheduler/apis/config" + scheduler_config "k8s.io/kubernetes/pkg/scheduler/apis/config/latest" + schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" + scheduler_plugins "k8s.io/kubernetes/pkg/scheduler/framework/plugins" + draplugin "k8s.io/kubernetes/pkg/scheduler/framework/plugins/dynamicresources" + schedulerframeworkruntime "k8s.io/kubernetes/pkg/scheduler/framework/runtime" + schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" +) + +// Handle is meant for interacting with the scheduler framework. +type Handle struct { + Framework schedulerframework.Framework + DelegatingLister *DelegatingSchedulerSharedLister +} + +// NewHandle builds a framework Handle based on the provided informers and scheduler config. +func NewHandle(informerFactory informers.SharedInformerFactory, schedConfig *config.KubeSchedulerConfiguration, draEnabled bool) (*Handle, error) { + if schedConfig == nil { + var err error + schedConfig, err = scheduler_config.Default() + if err != nil { + return nil, fmt.Errorf("couldn't create scheduler config: %v", err) + } + } + if len(schedConfig.Profiles) != 1 { + return nil, fmt.Errorf("unexpected scheduler config: expected one scheduler profile only (found %d profiles)", len(schedConfig.Profiles)) + } + schedProfile := &schedConfig.Profiles[0] + + sharedLister := NewDelegatingSchedulerSharedLister() + opts := []schedulerframeworkruntime.Option{ + schedulerframeworkruntime.WithInformerFactory(informerFactory), + schedulerframeworkruntime.WithSnapshotSharedLister(sharedLister), + } + + if draEnabled { + schedProfile = profileWithDraPlugin(schedProfile) + opts = append(opts, schedulerframeworkruntime.WithSharedDRAManager(sharedLister)) + } + + schedulermetrics.InitMetrics() + framework, err := schedulerframeworkruntime.NewFramework( + context.TODO(), + scheduler_plugins.NewInTreeRegistry(), + schedProfile, + opts..., + ) 
+ + if err != nil { + return nil, fmt.Errorf("couldn't create scheduler framework; %v", err) + } + + return &Handle{ + Framework: framework, + DelegatingLister: sharedLister, + }, nil +} + +func profileWithDraPlugin(profile *config.KubeSchedulerProfile) *config.KubeSchedulerProfile { + result := profile.DeepCopy() + addPluginIfNotPresent(&result.Plugins.PreFilter, draplugin.Name) + addPluginIfNotPresent(&result.Plugins.Filter, draplugin.Name) + addPluginIfNotPresent(&result.Plugins.Reserve, draplugin.Name) + return result +} + +func addPluginIfNotPresent(pluginSet *config.PluginSet, pluginName string) { + for _, plugin := range pluginSet.Enabled { + if plugin.Name == pluginName { + // Plugin already present in the set. + return + } + } + // Plugin not present in the set, add it. The set is taken by pointer so that the append is visible to the caller. + pluginSet.Enabled = append(pluginSet.Enabled, config.Plugin{Name: pluginName}) +} diff --git a/cluster-autoscaler/simulator/framework/infos.go b/cluster-autoscaler/simulator/framework/infos.go index c3af45d08258..2759124e3c49 100644 --- a/cluster-autoscaler/simulator/framework/infos.go +++ b/cluster-autoscaler/simulator/framework/infos.go @@ -18,7 +18,7 @@ package framework import ( apiv1 "k8s.io/api/core/v1" - resourceapi "k8s.io/api/resource/v1alpha3" + resourceapi "k8s.io/api/resource/v1beta1" "k8s.io/apimachinery/pkg/types" "k8s.io/klog/v2" schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" @@ -28,22 +28,24 @@ import ( type PodInfo struct { // This type embeds *apiv1.Pod to make the accesses easier - most of the code just needs to access the Pod. *apiv1.Pod + // PodExtraInfo is an embedded struct containing all additional information that CA needs to track about a Pod. + PodExtraInfo +} +// PodExtraInfo contains all necessary information about a Pod that Cluster Autoscaler needs to track, apart from the Pod itself. +// This is extracted from PodInfo so that it can be stored separately from the Pod. 
+type PodExtraInfo struct { // NeededResourceClaims contains ResourceClaim objects needed by the Pod. NeededResourceClaims []*resourceapi.ResourceClaim } -type podExtraInfo struct { - neededResourceClaims []*resourceapi.ResourceClaim -} - // NodeInfo contains all necessary information about a Node that Cluster Autoscaler needs to track. // It's essentially a wrapper around schedulerframework.NodeInfo, with extra data on top. type NodeInfo struct { // schedNodeInfo is the part of information needed by the scheduler. schedNodeInfo *schedulerframework.NodeInfo // podsExtraInfo contains extra pod-level data needed only by CA. - podsExtraInfo map[types.UID]podExtraInfo + podsExtraInfo map[types.UID]PodExtraInfo // Extra node-level data needed only by CA below. @@ -66,7 +68,7 @@ func (n *NodeInfo) Pods() []*PodInfo { var result []*PodInfo for _, pod := range n.schedNodeInfo.Pods { extraInfo := n.podsExtraInfo[pod.Pod.UID] - podInfo := &PodInfo{Pod: pod.Pod, NeededResourceClaims: extraInfo.neededResourceClaims} + podInfo := &PodInfo{Pod: pod.Pod, PodExtraInfo: extraInfo} result = append(result, podInfo) } return result @@ -75,7 +77,7 @@ func (n *NodeInfo) Pods() []*PodInfo { // AddPod adds the given Pod and associated data to the NodeInfo. func (n *NodeInfo) AddPod(pod *PodInfo) { n.schedNodeInfo.AddPod(pod.Pod) - n.podsExtraInfo[pod.UID] = podExtraInfo{neededResourceClaims: pod.NeededResourceClaims} + n.podsExtraInfo[pod.UID] = pod.PodExtraInfo } // RemovePod removes the given pod and its associated data from the NodeInfo. @@ -93,11 +95,28 @@ func (n *NodeInfo) ToScheduler() *schedulerframework.NodeInfo { return n.schedNodeInfo } +// DeepCopy clones the NodeInfo. 
+func (n *NodeInfo) DeepCopy() *NodeInfo { + var newPods []*PodInfo + for _, podInfo := range n.Pods() { + var newClaims []*resourceapi.ResourceClaim + for _, claim := range podInfo.NeededResourceClaims { + newClaims = append(newClaims, claim.DeepCopy()) + } + newPods = append(newPods, &PodInfo{Pod: podInfo.Pod.DeepCopy(), PodExtraInfo: PodExtraInfo{NeededResourceClaims: newClaims}}) + } + var newSlices []*resourceapi.ResourceSlice + for _, slice := range n.LocalResourceSlices { + newSlices = append(newSlices, slice.DeepCopy()) + } + return NewNodeInfo(n.Node().DeepCopy(), newSlices, newPods...) +} + // NewNodeInfo returns a new internal NodeInfo from the provided data. func NewNodeInfo(node *apiv1.Node, slices []*resourceapi.ResourceSlice, pods ...*PodInfo) *NodeInfo { result := &NodeInfo{ schedNodeInfo: schedulerframework.NewNodeInfo(), - podsExtraInfo: map[types.UID]podExtraInfo{}, + podsExtraInfo: map[types.UID]PodExtraInfo{}, LocalResourceSlices: slices, } if node != nil { @@ -110,18 +129,15 @@ func NewNodeInfo(node *apiv1.Node, slices []*resourceapi.ResourceSlice, pods ... } // WrapSchedulerNodeInfo wraps a *schedulerframework.NodeInfo into an internal *NodeInfo. -func WrapSchedulerNodeInfo(schedNodeInfo *schedulerframework.NodeInfo) *NodeInfo { +func WrapSchedulerNodeInfo(schedNodeInfo *schedulerframework.NodeInfo, slices []*resourceapi.ResourceSlice, podExtraInfos map[types.UID]PodExtraInfo) *NodeInfo { return &NodeInfo{ - schedNodeInfo: schedNodeInfo, - podsExtraInfo: map[types.UID]podExtraInfo{}, + schedNodeInfo: schedNodeInfo, + podsExtraInfo: podExtraInfos, + LocalResourceSlices: slices, } } -// WrapSchedulerNodeInfos wraps a list of *schedulerframework.NodeInfos into internal *NodeInfos. 
-func WrapSchedulerNodeInfos(schedNodeInfos []*schedulerframework.NodeInfo) []*NodeInfo { - var result []*NodeInfo - for _, schedNodeInfo := range schedNodeInfos { - result = append(result, WrapSchedulerNodeInfo(schedNodeInfo)) - } - return result +// NewPodInfo is a convenience function for creating new PodInfos without typing out the "PodExtraInfo" part. +func NewPodInfo(pod *apiv1.Pod, claims []*resourceapi.ResourceClaim) *PodInfo { + return &PodInfo{Pod: pod, PodExtraInfo: PodExtraInfo{NeededResourceClaims: claims}} } diff --git a/cluster-autoscaler/simulator/framework/infos_test.go b/cluster-autoscaler/simulator/framework/infos_test.go index e6f997129253..5413c1d0939a 100644 --- a/cluster-autoscaler/simulator/framework/infos_test.go +++ b/cluster-autoscaler/simulator/framework/infos_test.go @@ -24,7 +24,7 @@ import ( "github.com/google/go-cmp/cmp/cmpopts" apiv1 "k8s.io/api/core/v1" - resourceapi "k8s.io/api/resource/v1alpha3" + resourceapi "k8s.io/api/resource/v1beta1" v1 "k8s.io/apimachinery/pkg/apis/meta/v1" "k8s.io/apimachinery/pkg/types" "k8s.io/autoscaler/cluster-autoscaler/utils/test" @@ -105,11 +105,27 @@ func TestNodeInfo(t *testing.T) { wantPods: testPodInfos(pods, false), }, { - testName: "wrapping via WrapSchedulerNodeInfo", - modFn: WrapSchedulerNodeInfo, + testName: "wrapping via WrapSchedulerNodeInfo", + modFn: func(info *schedulerframework.NodeInfo) *NodeInfo { + return WrapSchedulerNodeInfo(schedulerNodeInfo, nil, nil) + }, wantSchedNodeInfo: schedulerNodeInfo, wantPods: testPodInfos(pods, false), }, + { + testName: "wrapping via WrapSchedulerNodeInfo with DRA objects", + modFn: func(info *schedulerframework.NodeInfo) *NodeInfo { + podInfos := testPodInfos(pods, true) + extraInfos := make(map[types.UID]PodExtraInfo) + for _, podInfo := range podInfos { + extraInfos[podInfo.Pod.UID] = podInfo.PodExtraInfo + } + return WrapSchedulerNodeInfo(schedulerNodeInfo, slices, extraInfos) + }, + wantSchedNodeInfo: schedulerNodeInfo, + 
wantLocalResourceSlices: slices, + wantPods: testPodInfos(pods, true), + }, { testName: "wrapping via SetNode+AddPod", modFn: func(info *schedulerframework.NodeInfo) *NodeInfo { @@ -208,6 +224,66 @@ func TestNodeInfo(t *testing.T) { } } +func TestDeepCopyNodeInfo(t *testing.T) { + node := test.BuildTestNode("node", 1000, 1000) + pods := []*PodInfo{ + {Pod: test.BuildTestPod("p1", 80, 0, test.WithNodeName(node.Name))}, + { + Pod: test.BuildTestPod("p2", 80, 0, test.WithNodeName(node.Name)), + PodExtraInfo: PodExtraInfo{ + NeededResourceClaims: []*resourceapi.ResourceClaim{ + {ObjectMeta: v1.ObjectMeta{Name: "claim1"}, Spec: resourceapi.ResourceClaimSpec{Devices: resourceapi.DeviceClaim{Requests: []resourceapi.DeviceRequest{{Name: "req1"}}}}}, + {ObjectMeta: v1.ObjectMeta{Name: "claim2"}, Spec: resourceapi.ResourceClaimSpec{Devices: resourceapi.DeviceClaim{Requests: []resourceapi.DeviceRequest{{Name: "req2"}}}}}, + }, + }, + }, + } + slices := []*resourceapi.ResourceSlice{ + {ObjectMeta: v1.ObjectMeta{Name: "slice1"}, Spec: resourceapi.ResourceSliceSpec{NodeName: "node"}}, + {ObjectMeta: v1.ObjectMeta{Name: "slice2"}, Spec: resourceapi.ResourceSliceSpec{NodeName: "node"}}, + } + nodeInfo := NewNodeInfo(node, slices, pods...) + + // Verify that the contents are identical after copying. + nodeInfoCopy := nodeInfo.DeepCopy() + if diff := cmp.Diff(nodeInfo, nodeInfoCopy, + cmp.AllowUnexported(schedulerframework.NodeInfo{}, NodeInfo{}, PodInfo{}), + // We don't care about this field staying the same, and it differs because it's a global counter bumped + // on every AddPod. + cmpopts.IgnoreFields(schedulerframework.NodeInfo{}, "Generation"), + ); diff != "" { + t.Errorf("nodeInfo differs after DeepCopyNodeInfo, diff (-want +got): %s", diff) + } + + // Verify that the object addresses changed in the copy. 
+ if nodeInfo == nodeInfoCopy { + t.Error("nodeInfo address identical after DeepCopyNodeInfo") + } + if nodeInfo.ToScheduler() == nodeInfoCopy.ToScheduler() { + t.Error("schedulerframework.NodeInfo address identical after DeepCopyNodeInfo") + } + for i := range len(nodeInfo.LocalResourceSlices) { + if nodeInfo.LocalResourceSlices[i] == nodeInfoCopy.LocalResourceSlices[i] { + t.Errorf("%d-th LocalResourceSlice address identical after DeepCopyNodeInfo", i) + } + } + for podIndex := range len(pods) { + oldPodInfo := nodeInfo.Pods()[podIndex] + newPodInfo := nodeInfoCopy.Pods()[podIndex] + if oldPodInfo == newPodInfo { + t.Errorf("%d-th PodInfo address identical after DeepCopyNodeInfo", podIndex) + } + if oldPodInfo.Pod == newPodInfo.Pod { + t.Errorf("%d-th PodInfo.Pod address identical after DeepCopyNodeInfo", podIndex) + } + for claimIndex := range len(newPodInfo.NeededResourceClaims) { + if oldPodInfo.NeededResourceClaims[claimIndex] == newPodInfo.NeededResourceClaims[claimIndex] { + t.Errorf("%d-th PodInfo - %d-th NeededResourceClaim address identical after DeepCopyNodeInfo", podIndex, claimIndex) + } + } + } +} + func testPodInfos(pods []*apiv1.Pod, addClaims bool) []*PodInfo { var result []*PodInfo for _, pod := range pods { diff --git a/cluster-autoscaler/simulator/framework/test_utils.go b/cluster-autoscaler/simulator/framework/test_utils.go index 9cdfd45eccd1..ba8489121c2b 100644 --- a/cluster-autoscaler/simulator/framework/test_utils.go +++ b/cluster-autoscaler/simulator/framework/test_utils.go @@ -18,14 +18,44 @@ package framework import ( apiv1 "k8s.io/api/core/v1" + "k8s.io/client-go/informers" + clientsetfake "k8s.io/client-go/kubernetes/fake" + scheduler_config_latest "k8s.io/kubernetes/pkg/scheduler/apis/config/latest" ) +// testFailer is an abstraction that covers both *testing.T and *testing.B. 
+type testFailer interface { + Fatalf(format string, args ...any) +} + // NewTestNodeInfo returns a new NodeInfo without any DRA information - only to be used in test code. // Production code should always take DRA objects into account. func NewTestNodeInfo(node *apiv1.Node, pods ...*apiv1.Pod) *NodeInfo { nodeInfo := NewNodeInfo(node, nil) for _, pod := range pods { - nodeInfo.AddPod(&PodInfo{Pod: pod, NeededResourceClaims: nil}) + nodeInfo.AddPod(NewPodInfo(pod, nil)) } return nodeInfo } + +// NewTestFrameworkHandle creates a Handle that can be used in tests. +func NewTestFrameworkHandle() (*Handle, error) { + defaultConfig, err := scheduler_config_latest.Default() + if err != nil { + return nil, err + } + fwHandle, err := NewHandle(informers.NewSharedInformerFactory(clientsetfake.NewSimpleClientset(), 0), defaultConfig, true) + if err != nil { + return nil, err + } + return fwHandle, nil +} + +// NewTestFrameworkHandleOrDie creates a Handle that can be used in tests. +func NewTestFrameworkHandleOrDie(t testFailer) *Handle { + handle, err := NewTestFrameworkHandle() + if err != nil { + t.Fatalf("TestFrameworkHandleOrDie: couldn't create test framework handle: %v", err) + } + return handle +} diff --git a/cluster-autoscaler/simulator/node_info_utils.go b/cluster-autoscaler/simulator/node_info_utils.go new file mode 100644 index 000000000000..fe76dd925824 --- /dev/null +++ b/cluster-autoscaler/simulator/node_info_utils.go @@ -0,0 +1,153 @@ +/* +Copyright 2024 The Kubernetes Authors. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+See the License for the specific language governing permissions and +limitations under the License. +*/ + +package simulator + +import ( + "fmt" + "math/rand" + + appsv1 "k8s.io/api/apps/v1" + apiv1 "k8s.io/api/core/v1" + metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" + "k8s.io/apimachinery/pkg/types" + "k8s.io/apimachinery/pkg/util/uuid" + "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" + "k8s.io/autoscaler/cluster-autoscaler/utils/daemonset" + "k8s.io/autoscaler/cluster-autoscaler/utils/errors" + "k8s.io/autoscaler/cluster-autoscaler/utils/labels" + pod_util "k8s.io/autoscaler/cluster-autoscaler/utils/pod" + "k8s.io/autoscaler/cluster-autoscaler/utils/taints" +) + +type nodeGroupTemplateNodeInfoGetter interface { + Id() string + TemplateNodeInfo() (*framework.NodeInfo, error) +} + +// TemplateNodeInfoFromNodeGroupTemplate returns a template NodeInfo object based on NodeGroup.TemplateNodeInfo(). The template is sanitized, and only +// contains the pods that should appear on a new Node from the same node group (e.g. DaemonSet pods). +func TemplateNodeInfoFromNodeGroupTemplate(nodeGroup nodeGroupTemplateNodeInfoGetter, daemonsets []*appsv1.DaemonSet, taintConfig taints.TaintConfig) (*framework.NodeInfo, errors.AutoscalerError) { + id := nodeGroup.Id() + baseNodeInfo, err := nodeGroup.TemplateNodeInfo() + if err != nil { + return nil, errors.ToAutoscalerError(errors.CloudProviderError, err) + } + labels.UpdateDeprecatedLabels(baseNodeInfo.Node().ObjectMeta.Labels) + + return TemplateNodeInfoFromExampleNodeInfo(baseNodeInfo, id, daemonsets, true, taintConfig) +} + +// TemplateNodeInfoFromExampleNodeInfo returns a template NodeInfo object based on a real example NodeInfo from the cluster. The template is sanitized, and only +// contains the pods that should appear on a new Node from the same node group (e.g. DaemonSet pods). 
+func TemplateNodeInfoFromExampleNodeInfo(example *framework.NodeInfo, nodeGroupId string, daemonsets []*appsv1.DaemonSet, forceDaemonSets bool, taintConfig taints.TaintConfig) (*framework.NodeInfo, errors.AutoscalerError) { + randSuffix := fmt.Sprintf("%d", rand.Int63()) + newNodeNameBase := fmt.Sprintf("template-node-for-%s", nodeGroupId) + + // We need to sanitize the example before determining the DS pods, since taints are checked there, and + // we might need to filter some out during sanitization. + sanitizedExample := sanitizeNodeInfo(example, newNodeNameBase, randSuffix, &taintConfig) + expectedPods, err := podsExpectedOnFreshNode(sanitizedExample, daemonsets, forceDaemonSets, randSuffix) + if err != nil { + return nil, err + } + // No need to sanitize the expected pods again - they either come from sanitizedExample and were sanitized above, + // or were added by podsExpectedOnFreshNode and sanitized there. + return framework.NewNodeInfo(sanitizedExample.Node(), nil, expectedPods...), nil +} + +// FreshNodeInfoFromTemplateNodeInfo duplicates the provided template NodeInfo, returning a fresh NodeInfo that can be injected into the cluster snapshot. +// The NodeInfo is sanitized (names, UIDs are changed, etc.), so that it can be injected along other copies created from the same template. +func FreshNodeInfoFromTemplateNodeInfo(template *framework.NodeInfo, suffix string) *framework.NodeInfo { + // Template node infos should already have taints and pods filtered, so not setting these parameters. 
+ return sanitizeNodeInfo(template, template.Node().Name, suffix, nil) +} + +func sanitizeNodeInfo(nodeInfo *framework.NodeInfo, newNodeNameBase string, namesSuffix string, taintConfig *taints.TaintConfig) *framework.NodeInfo { + freshNodeName := fmt.Sprintf("%s-%s", newNodeNameBase, namesSuffix) + freshNode := sanitizeNode(nodeInfo.Node(), freshNodeName, taintConfig) + result := framework.NewNodeInfo(freshNode, nil) + + for _, podInfo := range nodeInfo.Pods() { + freshPod := sanitizePod(podInfo.Pod, freshNode.Name, namesSuffix) + result.AddPod(framework.NewPodInfo(freshPod, nil)) + } + return result +} + +func sanitizeNode(node *apiv1.Node, newName string, taintConfig *taints.TaintConfig) *apiv1.Node { + newNode := node.DeepCopy() + newNode.UID = uuid.NewUUID() + + newNode.Name = newName + if newNode.Labels == nil { + newNode.Labels = make(map[string]string) + } + newNode.Labels[apiv1.LabelHostname] = newName + + if taintConfig != nil { + newNode.Spec.Taints = taints.SanitizeTaints(newNode.Spec.Taints, *taintConfig) + } + return newNode +} + +func sanitizePod(pod *apiv1.Pod, nodeName, nameSuffix string) *apiv1.Pod { + sanitizedPod := pod.DeepCopy() + sanitizedPod.UID = uuid.NewUUID() + sanitizedPod.Name = fmt.Sprintf("%s-%s", pod.Name, nameSuffix) + sanitizedPod.Spec.NodeName = nodeName + return sanitizedPod +} + +func podsExpectedOnFreshNode(sanitizedExampleNodeInfo *framework.NodeInfo, daemonsets []*appsv1.DaemonSet, forceDaemonSets bool, nameSuffix string) ([]*framework.PodInfo, errors.AutoscalerError) { + var result []*framework.PodInfo + runningDS := make(map[types.UID]bool) + for _, pod := range sanitizedExampleNodeInfo.Pods() { + // Ignore scheduled pods in deletion phase + if pod.DeletionTimestamp != nil { + continue + } + // Add scheduled mirror and DS pods + if pod_util.IsMirrorPod(pod.Pod) || pod_util.IsDaemonSetPod(pod.Pod) { + result = append(result, pod) + } + // Mark DS pods as running + controllerRef := metav1.GetControllerOf(pod) + if 
controllerRef != nil && controllerRef.Kind == "DaemonSet" { + runningDS[controllerRef.UID] = true + } + } + // Add all pending DS pods if force scheduling DS + if forceDaemonSets { + var pendingDS []*appsv1.DaemonSet + for _, ds := range daemonsets { + if !runningDS[ds.UID] { + pendingDS = append(pendingDS, ds) + } + } + // The provided nodeInfo has to have taints properly sanitized, or this won't work correctly. + daemonPods, err := daemonset.GetDaemonSetPodsForNode(sanitizedExampleNodeInfo, pendingDS) + if err != nil { + return nil, errors.ToAutoscalerError(errors.InternalError, err) + } + for _, pod := range daemonPods { + // There's technically no need to sanitize these pods since they're created from scratch, but + // it's nice to have the same suffix for all names in one sanitized NodeInfo when debugging. + result = append(result, &framework.PodInfo{Pod: sanitizePod(pod.Pod, sanitizedExampleNodeInfo.Node().Name, nameSuffix)}) + } + } + return result, nil +} diff --git a/cluster-autoscaler/simulator/node_info_utils_test.go b/cluster-autoscaler/simulator/node_info_utils_test.go new file mode 100644 index 000000000000..00350eb36947 --- /dev/null +++ b/cluster-autoscaler/simulator/node_info_utils_test.go @@ -0,0 +1,510 @@ +/* +Copyright 2024 The Kubernetes Authors. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. 
+*/ + +package simulator + +import ( + "fmt" + "math/rand" + "strings" + "testing" + "time" + + "github.com/google/go-cmp/cmp" + "github.com/google/go-cmp/cmp/cmpopts" + appsv1 "k8s.io/api/apps/v1" + apiv1 "k8s.io/api/core/v1" + metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" + "k8s.io/apimachinery/pkg/types" + "k8s.io/autoscaler/cluster-autoscaler/config" + "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" + "k8s.io/autoscaler/cluster-autoscaler/utils/errors" + "k8s.io/autoscaler/cluster-autoscaler/utils/taints" + . "k8s.io/autoscaler/cluster-autoscaler/utils/test" + "k8s.io/kubernetes/pkg/controller/daemon" +) + +var ( + ds1 = &appsv1.DaemonSet{ + ObjectMeta: metav1.ObjectMeta{ + Name: "ds1", + Namespace: "ds1-namespace", + UID: types.UID("ds1"), + }, + } + ds2 = &appsv1.DaemonSet{ + ObjectMeta: metav1.ObjectMeta{ + Name: "ds2", + Namespace: "ds2-namespace", + UID: types.UID("ds2"), + }, + } + ds3 = &appsv1.DaemonSet{ + ObjectMeta: metav1.ObjectMeta{ + Name: "ds3", + Namespace: "ds3-namespace", + UID: types.UID("ds3"), + }, + Spec: appsv1.DaemonSetSpec{ + Template: apiv1.PodTemplateSpec{ + Spec: apiv1.PodSpec{ + NodeSelector: map[string]string{"key": "value"}, + }, + }, + }, + } + testDaemonSets = []*appsv1.DaemonSet{ds1, ds2, ds3} +) + +func TestTemplateNodeInfoFromNodeGroupTemplate(t *testing.T) { + exampleNode := BuildTestNode("n", 1000, 10) + exampleNode.Spec.Taints = []apiv1.Taint{ + {Key: taints.ToBeDeletedTaint, Value: "2312532423", Effect: apiv1.TaintEffectNoSchedule}, + } + + for _, tc := range []struct { + testName string + nodeGroup *fakeNodeGroup + + wantPods []*apiv1.Pod + wantCpError bool + }{ + { + testName: "node group error results in an error", + nodeGroup: &fakeNodeGroup{templateNodeInfoErr: fmt.Errorf("test error")}, + wantCpError: true, + }, + { + testName: "simple template with no pods", + nodeGroup: &fakeNodeGroup{ + templateNodeInfoResult: framework.NewNodeInfo(exampleNode, nil), + }, + wantPods: []*apiv1.Pod{ + buildDSPod(ds1, 
"n"), + buildDSPod(ds2, "n"), + }, + }, + { + testName: "template with all kinds of pods", + nodeGroup: &fakeNodeGroup{ + templateNodeInfoResult: framework.NewNodeInfo(exampleNode, nil, + &framework.PodInfo{Pod: BuildScheduledTestPod("p1", 100, 1, "n")}, + &framework.PodInfo{Pod: BuildScheduledTestPod("p2", 100, 1, "n")}, + &framework.PodInfo{Pod: SetMirrorPodSpec(BuildScheduledTestPod("p3", 100, 1, "n"))}, + &framework.PodInfo{Pod: setDeletionTimestamp(SetMirrorPodSpec(BuildScheduledTestPod("p4", 100, 1, "n")))}, + &framework.PodInfo{Pod: buildDSPod(ds1, "n")}, + &framework.PodInfo{Pod: setDeletionTimestamp(buildDSPod(ds2, "n"))}, + ), + }, + wantPods: []*apiv1.Pod{ + SetMirrorPodSpec(BuildScheduledTestPod("p3", 100, 1, "n")), + buildDSPod(ds1, "n"), + buildDSPod(ds2, "n"), + }, + }, + } { + t.Run(tc.testName, func(t *testing.T) { + templateNodeInfo, err := TemplateNodeInfoFromNodeGroupTemplate(tc.nodeGroup, testDaemonSets, taints.TaintConfig{}) + if tc.wantCpError { + if err == nil || err.Type() != errors.CloudProviderError { + t.Fatalf("TemplateNodeInfoFromNodeGroupTemplate(): want CloudProviderError, but got: %v (%T)", err, err) + } else { + return + } + } + if err != nil { + t.Fatalf("TemplateNodeInfoFromNodeGroupTemplate(): expected no error, but got %v", err) + } + + // Verify that the taints are correctly sanitized. + // Verify that the NodeInfo is sanitized using the node group id as base. + // Pass empty string as nameSuffix so that it's auto-determined from the sanitized templateNodeInfo, because + // TemplateNodeInfoFromNodeGroupTemplate randomizes the suffix. + // Pass non-empty expectedPods to verify that the set of pods is changed as expected (e.g. DS pods added, non-DS/deleted pods removed). 
+ if err := verifyNodeInfoSanitization(tc.nodeGroup.templateNodeInfoResult, templateNodeInfo, tc.wantPods, "template-node-for-"+tc.nodeGroup.id, "", nil); err != nil { + t.Fatalf("TemplateNodeInfoFromExampleNodeInfo(): NodeInfo wasn't properly sanitized: %v", err) + } + }) + } +} + +func TestTemplateNodeInfoFromExampleNodeInfo(t *testing.T) { + exampleNode := BuildTestNode("n", 1000, 10) + exampleNode.Spec.Taints = []apiv1.Taint{ + {Key: taints.ToBeDeletedTaint, Value: "2312532423", Effect: apiv1.TaintEffectNoSchedule}, + } + + testCases := []struct { + name string + pods []*apiv1.Pod + daemonSets []*appsv1.DaemonSet + forceDS bool + + wantPods []*apiv1.Pod + wantError bool + }{ + { + name: "node without any pods", + }, + { + name: "node with non-DS/mirror pods", + pods: []*apiv1.Pod{ + BuildScheduledTestPod("p1", 100, 1, "n"), + BuildScheduledTestPod("p2", 100, 1, "n"), + }, + wantPods: []*apiv1.Pod{}, + }, + { + name: "node with a mirror pod", + pods: []*apiv1.Pod{ + SetMirrorPodSpec(BuildScheduledTestPod("p1", 100, 1, "n")), + }, + wantPods: []*apiv1.Pod{ + SetMirrorPodSpec(BuildScheduledTestPod("p1", 100, 1, "n")), + }, + }, + { + name: "node with a deleted mirror pod", + pods: []*apiv1.Pod{ + SetMirrorPodSpec(BuildScheduledTestPod("p1", 100, 1, "n")), + setDeletionTimestamp(SetMirrorPodSpec(BuildScheduledTestPod("p2", 100, 1, "n"))), + }, + wantPods: []*apiv1.Pod{ + SetMirrorPodSpec(BuildScheduledTestPod("p1", 100, 1, "n")), + }, + }, + { + name: "node with DS pods [forceDS=false, no daemon sets]", + pods: []*apiv1.Pod{ + buildDSPod(ds1, "n"), + setDeletionTimestamp(buildDSPod(ds2, "n")), + }, + wantPods: []*apiv1.Pod{ + buildDSPod(ds1, "n"), + }, + }, + { + name: "node with DS pods [forceDS=false, some daemon sets]", + pods: []*apiv1.Pod{ + buildDSPod(ds1, "n"), + setDeletionTimestamp(buildDSPod(ds2, "n")), + }, + daemonSets: testDaemonSets, + wantPods: []*apiv1.Pod{ + buildDSPod(ds1, "n"), + }, + }, + { + name: "node with a DS pod [forceDS=true, no daemon 
sets]", + pods: []*apiv1.Pod{ + buildDSPod(ds1, "n"), + setDeletionTimestamp(buildDSPod(ds2, "n")), + }, + wantPods: []*apiv1.Pod{ + buildDSPod(ds1, "n"), + }, + forceDS: true, + }, + { + name: "node with a DS pod [forceDS=true, some daemon sets]", + pods: []*apiv1.Pod{ + buildDSPod(ds1, "n"), + setDeletionTimestamp(buildDSPod(ds2, "n")), + }, + daemonSets: testDaemonSets, + forceDS: true, + wantPods: []*apiv1.Pod{ + buildDSPod(ds1, "n"), + buildDSPod(ds2, "n"), + }, + }, + { + name: "everything together [forceDS=false]", + pods: []*apiv1.Pod{ + BuildScheduledTestPod("p1", 100, 1, "n"), + BuildScheduledTestPod("p2", 100, 1, "n"), + SetMirrorPodSpec(BuildScheduledTestPod("p3", 100, 1, "n")), + setDeletionTimestamp(SetMirrorPodSpec(BuildScheduledTestPod("p4", 100, 1, "n"))), + buildDSPod(ds1, "n"), + setDeletionTimestamp(buildDSPod(ds2, "n")), + }, + daemonSets: testDaemonSets, + wantPods: []*apiv1.Pod{ + SetMirrorPodSpec(BuildScheduledTestPod("p3", 100, 1, "n")), + buildDSPod(ds1, "n"), + }, + }, + { + name: "everything together [forceDS=true]", + pods: []*apiv1.Pod{ + BuildScheduledTestPod("p1", 100, 1, "n"), + BuildScheduledTestPod("p2", 100, 1, "n"), + SetMirrorPodSpec(BuildScheduledTestPod("p3", 100, 1, "n")), + setDeletionTimestamp(SetMirrorPodSpec(BuildScheduledTestPod("p4", 100, 1, "n"))), + buildDSPod(ds1, "n"), + setDeletionTimestamp(buildDSPod(ds2, "n")), + }, + daemonSets: testDaemonSets, + forceDS: true, + wantPods: []*apiv1.Pod{ + SetMirrorPodSpec(BuildScheduledTestPod("p3", 100, 1, "n")), + buildDSPod(ds1, "n"), + buildDSPod(ds2, "n"), + }, + }, + } + + for _, tc := range testCases { + t.Run(tc.name, func(t *testing.T) { + nodeGroupId := "nodeGroupId" + exampleNodeInfo := framework.NewNodeInfo(exampleNode, nil) + for _, pod := range tc.pods { + exampleNodeInfo.AddPod(&framework.PodInfo{Pod: pod}) + } + + templateNodeInfo, err := TemplateNodeInfoFromExampleNodeInfo(exampleNodeInfo, nodeGroupId, tc.daemonSets, tc.forceDS, taints.TaintConfig{}) + if 
tc.wantError { + if err == nil { + t.Fatal("TemplateNodeInfoFromExampleNodeInfo(): want error, but got nil") + } else { + return + } + } + if err != nil { + t.Fatalf("TemplateNodeInfoFromExampleNodeInfo(): expected no error, but got %v", err) + } + + // Verify that the taints are correctly sanitized. + // Verify that the NodeInfo is sanitized using the node group id as base. + // Pass empty string as nameSuffix so that it's auto-determined from the sanitized templateNodeInfo, because + // TemplateNodeInfoFromExampleNodeInfo randomizes the suffix. + // Pass non-empty expectedPods to verify that the set of pods is changed as expected (e.g. DS pods added, non-DS/deleted pods removed). + if err := verifyNodeInfoSanitization(exampleNodeInfo, templateNodeInfo, tc.wantPods, "template-node-for-"+nodeGroupId, "", nil); err != nil { + t.Fatalf("TemplateNodeInfoFromExampleNodeInfo(): NodeInfo wasn't properly sanitized: %v", err) + } + }) + } +} + +func TestFreshNodeInfoFromTemplateNodeInfo(t *testing.T) { + nodeName := "template-node" + templateNode := BuildTestNode(nodeName, 1000, 1000) + templateNode.Spec.Taints = []apiv1.Taint{ + {Key: "startup-taint", Value: "true", Effect: apiv1.TaintEffectNoSchedule}, + {Key: taints.ToBeDeletedTaint, Value: "2312532423", Effect: apiv1.TaintEffectNoSchedule}, + {Key: "a", Value: "b", Effect: apiv1.TaintEffectNoSchedule}, + } + pods := []*framework.PodInfo{ + {Pod: BuildTestPod("p1", 80, 0, WithNodeName(nodeName))}, + {Pod: BuildTestPod("p2", 80, 0, WithNodeName(nodeName))}, + } + templateNodeInfo := framework.NewNodeInfo(templateNode, nil, pods...) + + suffix := "abc" + freshNodeInfo := FreshNodeInfoFromTemplateNodeInfo(templateNodeInfo, suffix) + // Verify that the taints are not sanitized (they should be sanitized in the template already). + // Verify that the NodeInfo is sanitized using the template Node name as base. 
+ initialTaints := templateNodeInfo.Node().Spec.Taints + if err := verifyNodeInfoSanitization(templateNodeInfo, freshNodeInfo, nil, templateNodeInfo.Node().Name, suffix, initialTaints); err != nil { + t.Fatalf("FreshNodeInfoFromTemplateNodeInfo(): NodeInfo wasn't properly sanitized: %v", err) + } +} + +func TestSanitizeNodeInfo(t *testing.T) { + oldNodeName := "old-node" + basicNode := BuildTestNode(oldNodeName, 1000, 1000) + + labelsNode := basicNode.DeepCopy() + labelsNode.Labels = map[string]string{ + apiv1.LabelHostname: oldNodeName, + "a": "b", + "x": "y", + } + + taintsNode := basicNode.DeepCopy() + taintsNode.Spec.Taints = []apiv1.Taint{ + {Key: "startup-taint", Value: "true", Effect: apiv1.TaintEffectNoSchedule}, + {Key: taints.ToBeDeletedTaint, Value: "2312532423", Effect: apiv1.TaintEffectNoSchedule}, + {Key: "a", Value: "b", Effect: apiv1.TaintEffectNoSchedule}, + } + taintConfig := taints.NewTaintConfig(config.AutoscalingOptions{StartupTaints: []string{"startup-taint"}}) + + taintsLabelsNode := labelsNode.DeepCopy() + taintsLabelsNode.Spec.Taints = taintsNode.Spec.Taints + + pods := []*framework.PodInfo{ + {Pod: BuildTestPod("p1", 80, 0, WithNodeName(oldNodeName))}, + {Pod: BuildTestPod("p2", 80, 0, WithNodeName(oldNodeName))}, + } + + for _, tc := range []struct { + testName string + + nodeInfo *framework.NodeInfo + taintConfig *taints.TaintConfig + + wantTaints []apiv1.Taint + }{ + { + testName: "sanitize node", + nodeInfo: framework.NewTestNodeInfo(basicNode), + }, + { + testName: "sanitize node labels", + nodeInfo: framework.NewTestNodeInfo(labelsNode), + }, + { + testName: "sanitize node taints - disabled", + nodeInfo: framework.NewTestNodeInfo(taintsNode), + taintConfig: nil, + wantTaints: taintsNode.Spec.Taints, + }, + { + testName: "sanitize node taints - enabled", + nodeInfo: framework.NewTestNodeInfo(taintsNode), + taintConfig: &taintConfig, + wantTaints: []apiv1.Taint{{Key: "a", Value: "b", Effect: apiv1.TaintEffectNoSchedule}}, + }, + { + 
testName: "sanitize pods", + nodeInfo: framework.NewNodeInfo(basicNode, nil, pods...), + }, + { + testName: "sanitize everything", + nodeInfo: framework.NewNodeInfo(taintsLabelsNode, nil, pods...), + taintConfig: &taintConfig, + wantTaints: []apiv1.Taint{{Key: "a", Value: "b", Effect: apiv1.TaintEffectNoSchedule}}, + }, + } { + t.Run(tc.testName, func(t *testing.T) { + newNameBase := "node" + suffix := "abc" + sanitizedNodeInfo := sanitizeNodeInfo(tc.nodeInfo, newNameBase, suffix, tc.taintConfig) + if err := verifyNodeInfoSanitization(tc.nodeInfo, sanitizedNodeInfo, nil, newNameBase, suffix, tc.wantTaints); err != nil { + t.Fatalf("sanitizeNodeInfo(): NodeInfo wasn't properly sanitized: %v", err) + } + }) + } +} + +// verifyNodeInfoSanitization verifies whether sanitizedNodeInfo was correctly sanitized starting from initialNodeInfo, with the provided +// nameBase and nameSuffix. The expected taints aren't auto-determined, so wantTaints should always be provided. +// +// If nameSuffix is an empty string, the suffix will be determined from sanitizedNodeInfo. This is useful if +// the test doesn't know/control the name suffix (e.g. because it's randomized by the tested function). +// +// If expectedPods is nil, the set of pods is expected not to change between initialNodeInfo and sanitizedNodeInfo. If the sanitization is +// expected to change the set of pods, the expected set should be passed to expectedPods. +func verifyNodeInfoSanitization(initialNodeInfo, sanitizedNodeInfo *framework.NodeInfo, expectedPods []*apiv1.Pod, nameBase, nameSuffix string, wantTaints []apiv1.Taint) error { + if nameSuffix == "" { + // Determine the suffix from the provided sanitized NodeInfo - it should be the last part of a dash-separated name. 
+ nameParts := strings.Split(sanitizedNodeInfo.Node().Name, "-") + if len(nameParts) < 2 { + return fmt.Errorf("sanitized NodeInfo name unexpected: want format -, got %q", sanitizedNodeInfo.Node().Name) + } + nameSuffix = nameParts[len(nameParts)-1] + } + if expectedPods != nil { + // If the sanitization is expected to change the set of pods, hack the initial NodeInfo to have the expected pods. + // Then we can just compare things pod-by-pod as if the set didn't change. + initialNodeInfo = framework.NewNodeInfo(initialNodeInfo.Node(), nil) + for _, pod := range expectedPods { + initialNodeInfo.AddPod(&framework.PodInfo{Pod: pod}) + } + } + + // Verification below assumes the same set of pods between initialNodeInfo and sanitizedNodeInfo. + wantNodeName := fmt.Sprintf("%s-%s", nameBase, nameSuffix) + if gotName := sanitizedNodeInfo.Node().Name; gotName != wantNodeName { + return fmt.Errorf("want sanitized Node name %q, got %q", wantNodeName, gotName) + } + if gotUid, oldUid := sanitizedNodeInfo.Node().UID, initialNodeInfo.Node().UID; gotUid == "" || gotUid == oldUid { + return fmt.Errorf("sanitized Node UID wasn't randomized - got %q, old UID was %q", gotUid, oldUid) + } + wantLabels := make(map[string]string) + for k, v := range initialNodeInfo.Node().Labels { + wantLabels[k] = v + } + wantLabels[apiv1.LabelHostname] = wantNodeName + if diff := cmp.Diff(wantLabels, sanitizedNodeInfo.Node().Labels); diff != "" { + return fmt.Errorf("sanitized Node labels unexpected, diff (-want +got): %s", diff) + } + if diff := cmp.Diff(wantTaints, sanitizedNodeInfo.Node().Spec.Taints); diff != "" { + return fmt.Errorf("sanitized Node taints unexpected, diff (-want +got): %s", diff) + } + if diff := cmp.Diff(initialNodeInfo.Node(), sanitizedNodeInfo.Node(), + cmpopts.IgnoreFields(metav1.ObjectMeta{}, "Name", "Labels", "UID"), + cmpopts.IgnoreFields(apiv1.NodeSpec{}, "Taints"), + ); diff != "" { + return fmt.Errorf("sanitized Node unexpected diff (-want +got): %s", diff) + } + + 
oldPods := initialNodeInfo.Pods() + newPods := sanitizedNodeInfo.Pods() + if len(oldPods) != len(newPods) { + return fmt.Errorf("want %d pods in sanitized NodeInfo, got %d", len(oldPods), len(newPods)) + } + for i, newPod := range newPods { + oldPod := oldPods[i] + + if newPod.Name == oldPod.Name || !strings.HasSuffix(newPod.Name, nameSuffix) { + return fmt.Errorf("sanitized Pod name unexpected: want (different than %q, ending in %q), got %q", oldPod.Name, nameSuffix, newPod.Name) + } + if gotUid, oldUid := newPod.UID, oldPod.UID; gotUid == "" || gotUid == oldUid { + return fmt.Errorf("sanitized Pod UID wasn't randomized - got %q, old UID was %q", gotUid, oldUid) + } + if gotNodeName := newPod.Spec.NodeName; gotNodeName != wantNodeName { + return fmt.Errorf("want sanitized Pod.Spec.NodeName %q, got %q", wantNodeName, gotNodeName) + } + if diff := cmp.Diff(oldPod, newPod, + cmpopts.IgnoreFields(metav1.ObjectMeta{}, "Name", "UID"), + cmpopts.IgnoreFields(apiv1.PodSpec{}, "NodeName"), + ); diff != "" { + return fmt.Errorf("sanitized Pod unexpected diff (-want +got): %s", diff) + } + } + return nil +} + +func buildDSPod(ds *appsv1.DaemonSet, nodeName string) *apiv1.Pod { + pod := daemon.NewPod(ds, nodeName) + pod.Name = fmt.Sprintf("%s-pod-%d", ds.Name, rand.Int63()) + ptrVal := true + pod.ObjectMeta.OwnerReferences = []metav1.OwnerReference{ + {Kind: "DaemonSet", UID: ds.UID, Name: ds.Name, Controller: &ptrVal}, + } + return pod +} + +func setDeletionTimestamp(pod *apiv1.Pod) *apiv1.Pod { + now := metav1.NewTime(time.Now()) + pod.DeletionTimestamp = &now + return pod +} + +type fakeNodeGroup struct { + id string + templateNodeInfoResult *framework.NodeInfo + templateNodeInfoErr error +} + +func (f *fakeNodeGroup) Id() string { + return f.id +} + +func (f *fakeNodeGroup) TemplateNodeInfo() (*framework.NodeInfo, error) { + return f.templateNodeInfoResult, f.templateNodeInfoErr +} diff --git a/cluster-autoscaler/simulator/nodes.go b/cluster-autoscaler/simulator/nodes.go 
deleted file mode 100644 index c80fe0cbe092..000000000000 --- a/cluster-autoscaler/simulator/nodes.go +++ /dev/null @@ -1,71 +0,0 @@ -/* -Copyright 2016 The Kubernetes Authors. - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. -*/ - -package simulator - -import ( - appsv1 "k8s.io/api/apps/v1" - apiv1 "k8s.io/api/core/v1" - metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" - "k8s.io/apimachinery/pkg/types" - "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/utils/daemonset" - "k8s.io/autoscaler/cluster-autoscaler/utils/errors" - - pod_util "k8s.io/autoscaler/cluster-autoscaler/utils/pod" -) - -// BuildNodeInfoForNode build a NodeInfo structure for the given node as if the node was just created. 
-func BuildNodeInfoForNode(node *apiv1.Node, scheduledPods []*apiv1.Pod, daemonsets []*appsv1.DaemonSet, forceDaemonSets bool) (*framework.NodeInfo, errors.AutoscalerError) { - nodeInfo := framework.NewNodeInfo(node, nil) - return addExpectedPods(nodeInfo, scheduledPods, daemonsets, forceDaemonSets) -} - -func addExpectedPods(nodeInfo *framework.NodeInfo, scheduledPods []*apiv1.Pod, daemonsets []*appsv1.DaemonSet, forceDaemonSets bool) (*framework.NodeInfo, errors.AutoscalerError) { - runningDS := make(map[types.UID]bool) - for _, pod := range scheduledPods { - // Ignore scheduled pods in deletion phase - if pod.DeletionTimestamp != nil { - continue - } - // Add scheduled mirror and DS pods - if pod_util.IsMirrorPod(pod) || pod_util.IsDaemonSetPod(pod) { - nodeInfo.AddPod(&framework.PodInfo{Pod: pod}) - } - // Mark DS pods as running - controllerRef := metav1.GetControllerOf(pod) - if controllerRef != nil && controllerRef.Kind == "DaemonSet" { - runningDS[controllerRef.UID] = true - } - } - // Add all pending DS pods if force scheduling DS - if forceDaemonSets { - var pendingDS []*appsv1.DaemonSet - for _, ds := range daemonsets { - if !runningDS[ds.UID] { - pendingDS = append(pendingDS, ds) - } - } - daemonPods, err := daemonset.GetDaemonSetPodsForNode(nodeInfo, pendingDS) - if err != nil { - return nil, errors.ToAutoscalerError(errors.InternalError, err) - } - for _, pod := range daemonPods { - nodeInfo.AddPod(pod) - } - } - return nodeInfo, nil -} diff --git a/cluster-autoscaler/simulator/nodes_test.go b/cluster-autoscaler/simulator/nodes_test.go deleted file mode 100644 index b931979de6cb..000000000000 --- a/cluster-autoscaler/simulator/nodes_test.go +++ /dev/null @@ -1,239 +0,0 @@ -/* -Copyright 2016 The Kubernetes Authors. - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. 
-You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. -*/ - -package simulator - -import ( - "strings" - "testing" - "time" - - "github.com/stretchr/testify/assert" - appsv1 "k8s.io/api/apps/v1" - apiv1 "k8s.io/api/core/v1" - metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" - "k8s.io/apimachinery/pkg/types" - "k8s.io/autoscaler/cluster-autoscaler/utils/test" - "k8s.io/kubernetes/pkg/controller/daemon" -) - -func TestBuildNodeInfoForNode(t *testing.T) { - ds1 := &appsv1.DaemonSet{ - ObjectMeta: metav1.ObjectMeta{ - Name: "ds1", - Namespace: "ds1-namespace", - UID: types.UID("ds1"), - }, - } - - ds2 := &appsv1.DaemonSet{ - ObjectMeta: metav1.ObjectMeta{ - Name: "ds2", - Namespace: "ds2-namespace", - UID: types.UID("ds2"), - }, - } - - ds3 := &appsv1.DaemonSet{ - ObjectMeta: metav1.ObjectMeta{ - Name: "ds3", - Namespace: "ds3-namespace", - UID: types.UID("ds3"), - }, - Spec: appsv1.DaemonSetSpec{ - Template: apiv1.PodTemplateSpec{ - Spec: apiv1.PodSpec{ - NodeSelector: map[string]string{"key": "value"}, - }, - }, - }, - } - - testCases := []struct { - name string - node *apiv1.Node - pods []*apiv1.Pod - daemonSets []*appsv1.DaemonSet - forceDS bool - - wantPods []*apiv1.Pod - wantError bool - }{ - { - name: "node without any pods", - node: test.BuildTestNode("n", 1000, 10), - }, - { - name: "node with non-DS/mirror pods", - node: test.BuildTestNode("n", 1000, 10), - pods: []*apiv1.Pod{ - test.BuildScheduledTestPod("p1", 100, 1, "n"), - test.BuildScheduledTestPod("p2", 100, 1, "n"), - }, - }, - { - name: "node with a mirror pod", - node: test.BuildTestNode("n", 1000, 10), - pods: []*apiv1.Pod{ - 
test.SetMirrorPodSpec(test.BuildScheduledTestPod("p1", 100, 1, "n")), - }, - wantPods: []*apiv1.Pod{ - test.SetMirrorPodSpec(test.BuildScheduledTestPod("p1", 100, 1, "n")), - }, - }, - { - name: "node with a deleted mirror pod", - node: test.BuildTestNode("n", 1000, 10), - pods: []*apiv1.Pod{ - test.SetMirrorPodSpec(test.BuildScheduledTestPod("p1", 100, 1, "n")), - setDeletionTimestamp(test.SetMirrorPodSpec(test.BuildScheduledTestPod("p2", 100, 1, "n"))), - }, - wantPods: []*apiv1.Pod{ - test.SetMirrorPodSpec(test.BuildScheduledTestPod("p1", 100, 1, "n")), - }, - }, - { - name: "node with DS pods [forceDS=false, no daemon sets]", - node: test.BuildTestNode("n", 1000, 10), - pods: []*apiv1.Pod{ - buildDSPod(ds1, "n"), - setDeletionTimestamp(buildDSPod(ds2, "n")), - }, - wantPods: []*apiv1.Pod{ - buildDSPod(ds1, "n"), - }, - }, - { - name: "node with DS pods [forceDS=false, some daemon sets]", - node: test.BuildTestNode("n", 1000, 10), - pods: []*apiv1.Pod{ - buildDSPod(ds1, "n"), - setDeletionTimestamp(buildDSPod(ds2, "n")), - }, - daemonSets: []*appsv1.DaemonSet{ds1, ds2, ds3}, - wantPods: []*apiv1.Pod{ - buildDSPod(ds1, "n"), - }, - }, - { - name: "node with a DS pod [forceDS=true, no daemon sets]", - node: test.BuildTestNode("n", 1000, 10), - pods: []*apiv1.Pod{ - buildDSPod(ds1, "n"), - setDeletionTimestamp(buildDSPod(ds2, "n")), - }, - wantPods: []*apiv1.Pod{ - buildDSPod(ds1, "n"), - }, - forceDS: true, - }, - { - name: "node with a DS pod [forceDS=true, some daemon sets]", - node: test.BuildTestNode("n", 1000, 10), - pods: []*apiv1.Pod{ - buildDSPod(ds1, "n"), - setDeletionTimestamp(buildDSPod(ds2, "n")), - }, - daemonSets: []*appsv1.DaemonSet{ds1, ds2, ds3}, - forceDS: true, - wantPods: []*apiv1.Pod{ - buildDSPod(ds1, "n"), - buildDSPod(ds2, "n"), - }, - }, - { - name: "everything together [forceDS=false]", - node: test.BuildTestNode("n", 1000, 10), - pods: []*apiv1.Pod{ - test.BuildScheduledTestPod("p1", 100, 1, "n"), - test.BuildScheduledTestPod("p2", 100, 
1, "n"), - test.SetMirrorPodSpec(test.BuildScheduledTestPod("p3", 100, 1, "n")), - setDeletionTimestamp(test.SetMirrorPodSpec(test.BuildScheduledTestPod("p4", 100, 1, "n"))), - buildDSPod(ds1, "n"), - setDeletionTimestamp(buildDSPod(ds2, "n")), - }, - daemonSets: []*appsv1.DaemonSet{ds1, ds2, ds3}, - wantPods: []*apiv1.Pod{ - test.SetMirrorPodSpec(test.BuildScheduledTestPod("p3", 100, 1, "n")), - buildDSPod(ds1, "n"), - }, - }, - { - name: "everything together [forceDS=true]", - node: test.BuildTestNode("n", 1000, 10), - pods: []*apiv1.Pod{ - test.BuildScheduledTestPod("p1", 100, 1, "n"), - test.BuildScheduledTestPod("p2", 100, 1, "n"), - test.SetMirrorPodSpec(test.BuildScheduledTestPod("p3", 100, 1, "n")), - setDeletionTimestamp(test.SetMirrorPodSpec(test.BuildScheduledTestPod("p4", 100, 1, "n"))), - buildDSPod(ds1, "n"), - setDeletionTimestamp(buildDSPod(ds2, "n")), - }, - daemonSets: []*appsv1.DaemonSet{ds1, ds2, ds3}, - forceDS: true, - wantPods: []*apiv1.Pod{ - test.SetMirrorPodSpec(test.BuildScheduledTestPod("p3", 100, 1, "n")), - buildDSPod(ds1, "n"), - buildDSPod(ds2, "n"), - }, - }, - } - - for _, tc := range testCases { - t.Run(tc.name, func(t *testing.T) { - nodeInfo, err := BuildNodeInfoForNode(tc.node, tc.pods, tc.daemonSets, tc.forceDS) - - if tc.wantError { - assert.Error(t, err) - } else { - assert.NoError(t, err) - assert.Equal(t, nodeInfo.Node(), tc.node) - - // clean pod metadata for comparison purposes - var wantPods, pods []*apiv1.Pod - for _, pod := range tc.wantPods { - wantPods = append(wantPods, cleanPodMetadata(pod)) - } - for _, podInfo := range nodeInfo.Pods() { - pods = append(pods, cleanPodMetadata(podInfo.Pod)) - } - assert.ElementsMatch(t, tc.wantPods, pods) - } - }) - } -} - -func cleanPodMetadata(pod *apiv1.Pod) *apiv1.Pod { - pod.Name = strings.Split(pod.Name, "-")[0] - pod.OwnerReferences = nil - return pod -} - -func buildDSPod(ds *appsv1.DaemonSet, nodeName string) *apiv1.Pod { - pod := daemon.NewPod(ds, nodeName) - pod.Name = 
ds.Name - ptrVal := true - pod.ObjectMeta.OwnerReferences = []metav1.OwnerReference{ - {Kind: "DaemonSet", UID: ds.UID, Controller: &ptrVal}, - } - return pod -} - -func setDeletionTimestamp(pod *apiv1.Pod) *apiv1.Pod { - now := metav1.NewTime(time.Now()) - pod.DeletionTimestamp = &now - return pod -} diff --git a/cluster-autoscaler/simulator/predicatechecker/delegating_shared_lister.go b/cluster-autoscaler/simulator/predicatechecker/delegating_shared_lister.go deleted file mode 100644 index be66bb8bd326..000000000000 --- a/cluster-autoscaler/simulator/predicatechecker/delegating_shared_lister.go +++ /dev/null @@ -1,96 +0,0 @@ -/* -Copyright 2020 The Kubernetes Authors. - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. -*/ - -package predicatechecker - -import ( - "fmt" - - schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" -) - -// DelegatingSchedulerSharedLister is an implementation of scheduler.SharedLister which -// passes logic to delegate. Delegate can be updated. -type DelegatingSchedulerSharedLister struct { - delegate schedulerframework.SharedLister -} - -// NewDelegatingSchedulerSharedLister creates new NewDelegatingSchedulerSharedLister -func NewDelegatingSchedulerSharedLister() *DelegatingSchedulerSharedLister { - return &DelegatingSchedulerSharedLister{ - delegate: unsetSharedListerSingleton, - } -} - -// NodeInfos returns a NodeInfoLister. 
-func (lister *DelegatingSchedulerSharedLister) NodeInfos() schedulerframework.NodeInfoLister { - return lister.delegate.NodeInfos() -} - -// StorageInfos returns a StorageInfoLister -func (lister *DelegatingSchedulerSharedLister) StorageInfos() schedulerframework.StorageInfoLister { - return lister.delegate.StorageInfos() -} - -// UpdateDelegate updates the delegate -func (lister *DelegatingSchedulerSharedLister) UpdateDelegate(delegate schedulerframework.SharedLister) { - lister.delegate = delegate -} - -// ResetDelegate resets delegate to -func (lister *DelegatingSchedulerSharedLister) ResetDelegate() { - lister.delegate = unsetSharedListerSingleton -} - -type unsetSharedLister struct{} -type unsetNodeInfoLister unsetSharedLister -type unsetStorageInfoLister unsetSharedLister - -// List always returns an error -func (lister *unsetNodeInfoLister) List() ([]*schedulerframework.NodeInfo, error) { - return nil, fmt.Errorf("lister not set in delegate") -} - -// HavePodsWithAffinityList always returns an error -func (lister *unsetNodeInfoLister) HavePodsWithAffinityList() ([]*schedulerframework.NodeInfo, error) { - return nil, fmt.Errorf("lister not set in delegate") -} - -// HavePodsWithRequiredAntiAffinityList always returns an error. 
-func (lister *unsetNodeInfoLister) HavePodsWithRequiredAntiAffinityList() ([]*schedulerframework.NodeInfo, error) { - return nil, fmt.Errorf("lister not set in delegate") -} - -// Get always returns an error -func (lister *unsetNodeInfoLister) Get(nodeName string) (*schedulerframework.NodeInfo, error) { - return nil, fmt.Errorf("lister not set in delegate") -} - -func (lister *unsetStorageInfoLister) IsPVCUsedByPods(key string) bool { - return false -} - -// NodeInfos: Pods returns a fake NodeInfoLister which always returns an error -func (lister *unsetSharedLister) NodeInfos() schedulerframework.NodeInfoLister { - return (*unsetNodeInfoLister)(lister) -} - -// StorageInfos: Pods returns a fake StorageInfoLister which always returns an error -func (lister *unsetSharedLister) StorageInfos() schedulerframework.StorageInfoLister { - return (*unsetStorageInfoLister)(lister) -} - -var unsetSharedListerSingleton *unsetSharedLister diff --git a/cluster-autoscaler/simulator/predicatechecker/error.go b/cluster-autoscaler/simulator/predicatechecker/error.go deleted file mode 100644 index 9e4d6de29d71..000000000000 --- a/cluster-autoscaler/simulator/predicatechecker/error.go +++ /dev/null @@ -1,107 +0,0 @@ -/* -Copyright 2019 The Kubernetes Authors. - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. 
-*/ - -package predicatechecker - -import ( - "fmt" - "strings" -) - -// PredicateErrorType is type of predicate error -type PredicateErrorType int - -const ( - // NotSchedulablePredicateError means that one of the filters returned that pod does not fit a node - NotSchedulablePredicateError PredicateErrorType = iota - // InternalPredicateError denotes internal unexpected error while calling PredicateChecker - InternalPredicateError -) - -// PredicateError is a structure representing error returned from predicate checking simulation. -type PredicateError struct { - errorType PredicateErrorType - predicateName string - errorMessage string - reasons []string - // debugInfo contains additional info that predicate doesn't include, - // but may be useful for debugging (e.g. taints on node blocking scale-up) - debugInfo func() string -} - -// ErrorType returns if error was internal of names predicate failure. -func (pe *PredicateError) ErrorType() PredicateErrorType { - return pe.errorType -} - -// PredicateName return name of predicate which failed. -func (pe *PredicateError) PredicateName() string { - return pe.predicateName -} - -// Message returns error message. -func (pe *PredicateError) Message() string { - if pe.errorMessage == "" { - return "unknown error" - } - return pe.errorMessage -} - -// VerboseMessage generates verbose error message. Building verbose message may be expensive so number of calls should be -// limited. -func (pe *PredicateError) VerboseMessage() string { - return fmt.Sprintf( - "%s; predicateName=%s; reasons: %s; debugInfo=%s", - pe.Message(), - pe.predicateName, - strings.Join(pe.reasons, ", "), - pe.debugInfo()) -} - -// Reasons returns failure reasons from failed predicate as a slice of strings. -func (pe *PredicateError) Reasons() []string { - return pe.reasons -} - -// NewPredicateError creates a new predicate error from error and reasons. 
-func NewPredicateError( - errorType PredicateErrorType, - predicateName string, - errorMessage string, - reasons []string, - debugInfo func() string, -) *PredicateError { - return &PredicateError{ - errorType: errorType, - predicateName: predicateName, - errorMessage: errorMessage, - reasons: reasons, - debugInfo: debugInfo, - } -} - -// GenericPredicateError return a generic instance of PredicateError to be used in context where predicate name is not -// know. -func GenericPredicateError() *PredicateError { - return &PredicateError{ - errorType: NotSchedulablePredicateError, - errorMessage: "generic predicate failure", - } -} - -func emptyString() string { - return "" -} diff --git a/cluster-autoscaler/simulator/predicatechecker/interface.go b/cluster-autoscaler/simulator/predicatechecker/interface.go deleted file mode 100644 index 2d35b779172c..000000000000 --- a/cluster-autoscaler/simulator/predicatechecker/interface.go +++ /dev/null @@ -1,31 +0,0 @@ -/* -Copyright 2020 The Kubernetes Authors. - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. -*/ - -package predicatechecker - -import ( - "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" - "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - - apiv1 "k8s.io/api/core/v1" -) - -// PredicateChecker checks whether all required predicates pass for given Pod and Node. 
-type PredicateChecker interface { - FitsAnyNode(clusterSnapshot clustersnapshot.ClusterSnapshot, pod *apiv1.Pod) (string, error) - FitsAnyNodeMatching(clusterSnapshot clustersnapshot.ClusterSnapshot, pod *apiv1.Pod, nodeMatches func(*framework.NodeInfo) bool) (string, error) - CheckPredicates(clusterSnapshot clustersnapshot.ClusterSnapshot, pod *apiv1.Pod, nodeName string) *PredicateError -} diff --git a/cluster-autoscaler/simulator/predicatechecker/schedulerbased.go b/cluster-autoscaler/simulator/predicatechecker/schedulerbased.go deleted file mode 100644 index 4e37e97528a2..000000000000 --- a/cluster-autoscaler/simulator/predicatechecker/schedulerbased.go +++ /dev/null @@ -1,198 +0,0 @@ -/* -Copyright 2016 The Kubernetes Authors. - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. 
-*/ - -package predicatechecker - -import ( - "context" - "fmt" - - "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" - "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - - apiv1 "k8s.io/api/core/v1" - "k8s.io/client-go/informers" - v1listers "k8s.io/client-go/listers/core/v1" - klog "k8s.io/klog/v2" - "k8s.io/kubernetes/pkg/scheduler/apis/config" - scheduler_config "k8s.io/kubernetes/pkg/scheduler/apis/config/latest" - schedulerframework "k8s.io/kubernetes/pkg/scheduler/framework" - scheduler_plugins "k8s.io/kubernetes/pkg/scheduler/framework/plugins" - schedulerframeworkruntime "k8s.io/kubernetes/pkg/scheduler/framework/runtime" -) - -// SchedulerBasedPredicateChecker checks whether all required predicates pass for given Pod and Node. -// The verification is done by calling out to scheduler code. -type SchedulerBasedPredicateChecker struct { - framework schedulerframework.Framework - delegatingSharedLister *DelegatingSchedulerSharedLister - nodeLister v1listers.NodeLister - podLister v1listers.PodLister - lastIndex int -} - -// NewSchedulerBasedPredicateChecker builds scheduler based PredicateChecker. 
-func NewSchedulerBasedPredicateChecker(informerFactory informers.SharedInformerFactory, schedConfig *config.KubeSchedulerConfiguration) (*SchedulerBasedPredicateChecker, error) { - if schedConfig == nil { - var err error - schedConfig, err = scheduler_config.Default() - if err != nil { - return nil, fmt.Errorf("couldn't create scheduler config: %v", err) - } - } - - if len(schedConfig.Profiles) != 1 { - return nil, fmt.Errorf("unexpected scheduler config: expected one scheduler profile only (found %d profiles)", len(schedConfig.Profiles)) - } - sharedLister := NewDelegatingSchedulerSharedLister() - - framework, err := schedulerframeworkruntime.NewFramework( - context.TODO(), - scheduler_plugins.NewInTreeRegistry(), - &schedConfig.Profiles[0], - schedulerframeworkruntime.WithInformerFactory(informerFactory), - schedulerframeworkruntime.WithSnapshotSharedLister(sharedLister), - ) - - if err != nil { - return nil, fmt.Errorf("couldn't create scheduler framework; %v", err) - } - - checker := &SchedulerBasedPredicateChecker{ - framework: framework, - delegatingSharedLister: sharedLister, - } - - return checker, nil -} - -// FitsAnyNode checks if the given pod can be placed on any of the given nodes. -func (p *SchedulerBasedPredicateChecker) FitsAnyNode(clusterSnapshot clustersnapshot.ClusterSnapshot, pod *apiv1.Pod) (string, error) { - return p.FitsAnyNodeMatching(clusterSnapshot, pod, func(*framework.NodeInfo) bool { - return true - }) -} - -// FitsAnyNodeMatching checks if the given pod can be placed on any of the given nodes matching the provided function. -func (p *SchedulerBasedPredicateChecker) FitsAnyNodeMatching(clusterSnapshot clustersnapshot.ClusterSnapshot, pod *apiv1.Pod, nodeMatches func(*framework.NodeInfo) bool) (string, error) { - if clusterSnapshot == nil { - return "", fmt.Errorf("ClusterSnapshot not provided") - } - - nodeInfosList, err := clusterSnapshot.ListNodeInfos() - if err != nil { - // This should never happen. 
- // - // Scheduler requires interface returning error, but no implementation - // of ClusterSnapshot ever does it. - klog.Errorf("Error obtaining nodeInfos from schedulerLister") - return "", fmt.Errorf("error obtaining nodeInfos from schedulerLister") - } - - p.delegatingSharedLister.UpdateDelegate(clusterSnapshot) - defer p.delegatingSharedLister.ResetDelegate() - - state := schedulerframework.NewCycleState() - preFilterResult, preFilterStatus, _ := p.framework.RunPreFilterPlugins(context.TODO(), state, pod) - if !preFilterStatus.IsSuccess() { - return "", fmt.Errorf("error running pre filter plugins for pod %s; %s", pod.Name, preFilterStatus.Message()) - } - - for i := range nodeInfosList { - nodeInfo := nodeInfosList[(p.lastIndex+i)%len(nodeInfosList)] - if !nodeMatches(nodeInfo) { - continue - } - - if !preFilterResult.AllNodes() && !preFilterResult.NodeNames.Has(nodeInfo.Node().Name) { - continue - } - - // Be sure that the node is schedulable. - if nodeInfo.Node().Spec.Unschedulable { - continue - } - - filterStatus := p.framework.RunFilterPlugins(context.TODO(), state, pod, nodeInfo.ToScheduler()) - if filterStatus.IsSuccess() { - p.lastIndex = (p.lastIndex + i + 1) % len(nodeInfosList) - return nodeInfo.Node().Name, nil - } - } - return "", fmt.Errorf("cannot put pod %s on any node", pod.Name) -} - -// CheckPredicates checks if the given pod can be placed on the given node. 
-func (p *SchedulerBasedPredicateChecker) CheckPredicates(clusterSnapshot clustersnapshot.ClusterSnapshot, pod *apiv1.Pod, nodeName string) *PredicateError { - if clusterSnapshot == nil { - return NewPredicateError(InternalPredicateError, "", "ClusterSnapshot not provided", nil, emptyString) - } - nodeInfo, err := clusterSnapshot.GetNodeInfo(nodeName) - if err != nil { - errorMessage := fmt.Sprintf("Error obtaining NodeInfo for name %s; %v", nodeName, err) - return NewPredicateError(InternalPredicateError, "", errorMessage, nil, emptyString) - } - - p.delegatingSharedLister.UpdateDelegate(clusterSnapshot) - defer p.delegatingSharedLister.ResetDelegate() - - state := schedulerframework.NewCycleState() - _, preFilterStatus, _ := p.framework.RunPreFilterPlugins(context.TODO(), state, pod) - if !preFilterStatus.IsSuccess() { - return NewPredicateError( - InternalPredicateError, - "", - preFilterStatus.Message(), - preFilterStatus.Reasons(), - emptyString) - } - - filterStatus := p.framework.RunFilterPlugins(context.TODO(), state, pod, nodeInfo.ToScheduler()) - - if !filterStatus.IsSuccess() { - filterName := filterStatus.Plugin() - filterMessage := filterStatus.Message() - filterReasons := filterStatus.Reasons() - if filterStatus.IsRejected() { - return NewPredicateError( - NotSchedulablePredicateError, - filterName, - filterMessage, - filterReasons, - p.buildDebugInfo(filterName, nodeInfo)) - } - return NewPredicateError( - InternalPredicateError, - filterName, - filterMessage, - filterReasons, - p.buildDebugInfo(filterName, nodeInfo)) - } - - return nil -} - -func (p *SchedulerBasedPredicateChecker) buildDebugInfo(filterName string, nodeInfo *framework.NodeInfo) func() string { - switch filterName { - case "TaintToleration": - taints := nodeInfo.Node().Spec.Taints - return func() string { - return fmt.Sprintf("taints on node: %#v", taints) - } - default: - return emptyString - } -} diff --git a/cluster-autoscaler/simulator/predicatechecker/schedulerbased_test.go 
b/cluster-autoscaler/simulator/predicatechecker/schedulerbased_test.go deleted file mode 100644 index d5423777f711..000000000000 --- a/cluster-autoscaler/simulator/predicatechecker/schedulerbased_test.go +++ /dev/null @@ -1,322 +0,0 @@ -/* -Copyright 2020 The Kubernetes Authors. - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. -*/ - -package predicatechecker - -import ( - "os" - "path/filepath" - "testing" - "time" - - testconfig "k8s.io/autoscaler/cluster-autoscaler/config/test" - "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" - "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - scheduler "k8s.io/autoscaler/cluster-autoscaler/utils/scheduler" - . 
"k8s.io/autoscaler/cluster-autoscaler/utils/test" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" - - "github.com/stretchr/testify/assert" - - apiv1 "k8s.io/api/core/v1" -) - -func TestCheckPredicate(t *testing.T) { - schedulermetrics.Register() - - p450 := BuildTestPod("p450", 450, 500000) - p600 := BuildTestPod("p600", 600, 500000) - p8000 := BuildTestPod("p8000", 8000, 0) - p500 := BuildTestPod("p500", 500, 500000) - - n1000 := BuildTestNode("n1000", 1000, 2000000) - SetNodeReadyState(n1000, true, time.Time{}) - n1000Unschedulable := BuildTestNode("n1000", 1000, 2000000) - SetNodeReadyState(n1000Unschedulable, true, time.Time{}) - - defaultPredicateChecker, err := NewTestPredicateChecker() - assert.NoError(t, err) - - // temp dir - tmpDir, err := os.MkdirTemp("", "scheduler-configs") - if err != nil { - t.Fatal(err) - } - defer os.RemoveAll(tmpDir) - - customConfigFile := filepath.Join(tmpDir, "custom_config.yaml") - if err := os.WriteFile(customConfigFile, - []byte(testconfig.SchedulerConfigNodeResourcesFitDisabled), - os.FileMode(0600)); err != nil { - t.Fatal(err) - } - - customConfig, err := scheduler.ConfigFromPath(customConfigFile) - assert.NoError(t, err) - customPredicateChecker, err := NewTestPredicateCheckerWithCustomConfig(customConfig) - assert.NoError(t, err) - - tests := []struct { - name string - node *apiv1.Node - scheduledPods []*apiv1.Pod - testPod *apiv1.Pod - predicateChecker PredicateChecker - expectError bool - }{ - // default predicate checker test cases - { - name: "default - other pod - insuficient cpu", - node: n1000, - scheduledPods: []*apiv1.Pod{p450}, - testPod: p600, - expectError: true, - predicateChecker: defaultPredicateChecker, - }, - { - name: "default - other pod - ok", - node: n1000, - scheduledPods: []*apiv1.Pod{p450}, - testPod: p500, - expectError: false, - predicateChecker: defaultPredicateChecker, - }, - { - name: "default - empty - insuficient cpu", - node: n1000, - scheduledPods: []*apiv1.Pod{}, - testPod: 
p8000, - expectError: true, - predicateChecker: defaultPredicateChecker, - }, - { - name: "default - empty - ok", - node: n1000, - scheduledPods: []*apiv1.Pod{}, - testPod: p600, - expectError: false, - predicateChecker: defaultPredicateChecker, - }, - // custom predicate checker test cases - { - name: "custom - other pod - ok", - node: n1000, - scheduledPods: []*apiv1.Pod{p450}, - testPod: p600, - expectError: false, - predicateChecker: customPredicateChecker, - }, - { - name: "custom -other pod - ok", - node: n1000, - scheduledPods: []*apiv1.Pod{p450}, - testPod: p500, - expectError: false, - predicateChecker: customPredicateChecker, - }, - { - name: "custom -empty - ok", - node: n1000, - scheduledPods: []*apiv1.Pod{}, - testPod: p8000, - expectError: false, - predicateChecker: customPredicateChecker, - }, - { - name: "custom -empty - ok", - node: n1000, - scheduledPods: []*apiv1.Pod{}, - testPod: p600, - expectError: false, - predicateChecker: customPredicateChecker, - }, - } - for _, tt := range tests { - t.Run(tt.name, func(t *testing.T) { - var err error - clusterSnapshot := clustersnapshot.NewBasicClusterSnapshot() - err = clusterSnapshot.AddNodeInfo(framework.NewTestNodeInfo(tt.node, tt.scheduledPods...)) - assert.NoError(t, err) - - predicateError := tt.predicateChecker.CheckPredicates(clusterSnapshot, tt.testPod, tt.node.Name) - if tt.expectError { - assert.NotNil(t, predicateError) - assert.Equal(t, NotSchedulablePredicateError, predicateError.ErrorType()) - assert.Equal(t, "Insufficient cpu", predicateError.Message()) - assert.Contains(t, predicateError.VerboseMessage(), "Insufficient cpu; predicateName=NodeResourcesFit") - } else { - assert.Nil(t, predicateError) - } - }) - } -} - -func TestFitsAnyNode(t *testing.T) { - p900 := BuildTestPod("p900", 900, 1000) - p1900 := BuildTestPod("p1900", 1900, 1000) - p2100 := BuildTestPod("p2100", 2100, 1000) - - n1000 := BuildTestNode("n1000", 1000, 2000000) - n2000 := BuildTestNode("n2000", 2000, 2000000) - - 
defaultPredicateChecker, err := NewTestPredicateChecker() - assert.NoError(t, err) - - // temp dir - tmpDir, err := os.MkdirTemp("", "scheduler-configs") - if err != nil { - t.Fatal(err) - } - defer os.RemoveAll(tmpDir) - - customConfigFile := filepath.Join(tmpDir, "custom_config.yaml") - if err := os.WriteFile(customConfigFile, - []byte(testconfig.SchedulerConfigNodeResourcesFitDisabled), - os.FileMode(0600)); err != nil { - t.Fatal(err) - } - - customConfig, err := scheduler.ConfigFromPath(customConfigFile) - assert.NoError(t, err) - customPredicateChecker, err := NewTestPredicateCheckerWithCustomConfig(customConfig) - assert.NoError(t, err) - - testCases := []struct { - name string - predicateChecker PredicateChecker - pod *apiv1.Pod - expectedNodes []string - expectError bool - }{ - // default predicate checker test cases - { - name: "default - small pod - no error", - predicateChecker: defaultPredicateChecker, - pod: p900, - expectedNodes: []string{"n1000", "n2000"}, - expectError: false, - }, - { - name: "default - medium pod - no error", - predicateChecker: defaultPredicateChecker, - pod: p1900, - expectedNodes: []string{"n2000"}, - expectError: false, - }, - { - name: "default - large pod - insufficient cpu", - predicateChecker: defaultPredicateChecker, - pod: p2100, - expectError: true, - }, - - // custom predicate checker test cases - { - name: "custom - small pod - no error", - predicateChecker: customPredicateChecker, - pod: p900, - expectedNodes: []string{"n1000", "n2000"}, - expectError: false, - }, - { - name: "custom - medium pod - no error", - predicateChecker: customPredicateChecker, - pod: p1900, - expectedNodes: []string{"n1000", "n2000"}, - expectError: false, - }, - { - name: "custom - large pod - insufficient cpu", - predicateChecker: customPredicateChecker, - pod: p2100, - expectedNodes: []string{"n1000", "n2000"}, - expectError: false, - }, - } - - clusterSnapshot := clustersnapshot.NewBasicClusterSnapshot() - err = 
clusterSnapshot.AddNodeInfo(framework.NewTestNodeInfo(n1000)) - assert.NoError(t, err) - err = clusterSnapshot.AddNodeInfo(framework.NewTestNodeInfo(n2000)) - assert.NoError(t, err) - - for _, tc := range testCases { - t.Run(tc.name, func(t *testing.T) { - nodeName, err := tc.predicateChecker.FitsAnyNode(clusterSnapshot, tc.pod) - if tc.expectError { - assert.Error(t, err) - } else { - assert.NoError(t, err) - assert.Contains(t, tc.expectedNodes, nodeName) - } - }) - } - -} - -func TestDebugInfo(t *testing.T) { - p1 := BuildTestPod("p1", 0, 0) - node1 := BuildTestNode("n1", 1000, 2000000) - node1.Spec.Taints = []apiv1.Taint{ - { - Key: "SomeTaint", - Value: "WhyNot?", - Effect: apiv1.TaintEffectNoSchedule, - }, - { - Key: "RandomTaint", - Value: "JustBecause", - Effect: apiv1.TaintEffectNoExecute, - }, - } - SetNodeReadyState(node1, true, time.Time{}) - - clusterSnapshot := clustersnapshot.NewBasicClusterSnapshot() - - err := clusterSnapshot.AddNodeInfo(framework.NewTestNodeInfo(node1)) - assert.NoError(t, err) - - // with default predicate checker - defaultPredicateChecker, err := NewTestPredicateChecker() - assert.NoError(t, err) - predicateErr := defaultPredicateChecker.CheckPredicates(clusterSnapshot, p1, "n1") - assert.NotNil(t, predicateErr) - assert.Equal(t, "node(s) had untolerated taint {SomeTaint: WhyNot?}", predicateErr.Message()) - assert.Contains(t, predicateErr.VerboseMessage(), "RandomTaint") - - // with custom predicate checker - - // temp dir - tmpDir, err := os.MkdirTemp("", "scheduler-configs") - if err != nil { - t.Fatal(err) - } - defer os.RemoveAll(tmpDir) - - customConfigFile := filepath.Join(tmpDir, "custom_config.yaml") - if err := os.WriteFile(customConfigFile, - []byte(testconfig.SchedulerConfigTaintTolerationDisabled), - os.FileMode(0600)); err != nil { - t.Fatal(err) - } - - customConfig, err := scheduler.ConfigFromPath(customConfigFile) - assert.NoError(t, err) - customPredicateChecker, err := 
NewTestPredicateCheckerWithCustomConfig(customConfig) - assert.NoError(t, err) - predicateErr = customPredicateChecker.CheckPredicates(clusterSnapshot, p1, "n1") - assert.Nil(t, predicateErr) -} diff --git a/cluster-autoscaler/simulator/predicatechecker/testchecker.go b/cluster-autoscaler/simulator/predicatechecker/testchecker.go deleted file mode 100644 index dd9e1745acac..000000000000 --- a/cluster-autoscaler/simulator/predicatechecker/testchecker.go +++ /dev/null @@ -1,45 +0,0 @@ -/* -Copyright 2020 The Kubernetes Authors. - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. -*/ - -package predicatechecker - -import ( - "k8s.io/client-go/informers" - clientsetfake "k8s.io/client-go/kubernetes/fake" - "k8s.io/kubernetes/pkg/scheduler/apis/config" - scheduler_config_latest "k8s.io/kubernetes/pkg/scheduler/apis/config/latest" -) - -// NewTestPredicateChecker builds test version of PredicateChecker. -func NewTestPredicateChecker() (PredicateChecker, error) { - schedConfig, err := scheduler_config_latest.Default() - if err != nil { - return nil, err - } - - // just call out to NewSchedulerBasedPredicateChecker but use fake kubeClient - return NewSchedulerBasedPredicateChecker(informers.NewSharedInformerFactory(clientsetfake.NewSimpleClientset(), 0), schedConfig) -} - -// NewTestPredicateCheckerWithCustomConfig builds test version of PredicateChecker with custom scheduler config. 
-func NewTestPredicateCheckerWithCustomConfig(schedConfig *config.KubeSchedulerConfiguration) (PredicateChecker, error) { - if schedConfig != nil { - // just call out to NewSchedulerBasedPredicateChecker but use fake kubeClient - return NewSchedulerBasedPredicateChecker(informers.NewSharedInformerFactory(clientsetfake.NewSimpleClientset(), 0), schedConfig) - } - - return NewTestPredicateChecker() -} diff --git a/cluster-autoscaler/simulator/scheduling/hinting_simulator.go b/cluster-autoscaler/simulator/scheduling/hinting_simulator.go index 2f24bb8bf4ba..0bbf77966e0f 100644 --- a/cluster-autoscaler/simulator/scheduling/hinting_simulator.go +++ b/cluster-autoscaler/simulator/scheduling/hinting_simulator.go @@ -17,11 +17,8 @@ limitations under the License. package scheduling import ( - "fmt" - "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" "k8s.io/autoscaler/cluster-autoscaler/utils/klogx" apiv1 "k8s.io/api/core/v1" @@ -35,15 +32,13 @@ type Status struct { // HintingSimulator is a helper object for simulating scheduler behavior. type HintingSimulator struct { - predicateChecker predicatechecker.PredicateChecker - hints *Hints + hints *Hints } // NewHintingSimulator returns a new HintingSimulator. 
-func NewHintingSimulator(predicateChecker predicatechecker.PredicateChecker) *HintingSimulator { +func NewHintingSimulator() *HintingSimulator { return &HintingSimulator{ - predicateChecker: predicateChecker, - hints: NewHints(), + hints: NewHints(), } } @@ -62,20 +57,20 @@ func (s *HintingSimulator) TrySchedulePods(clusterSnapshot clustersnapshot.Clust loggingQuota := klogx.PodsLoggingQuota() for _, pod := range pods { klogx.V(5).UpTo(loggingQuota).Infof("Looking for place for %s/%s", pod.Namespace, pod.Name) - nodeName, err := s.findNodeWithHints(clusterSnapshot, pod, isNodeAcceptable) + nodeName, err := s.tryScheduleUsingHints(clusterSnapshot, pod, isNodeAcceptable) if err != nil { return nil, 0, err } if nodeName == "" { - nodeName = s.findNode(similarPods, clusterSnapshot, pod, loggingQuota, isNodeAcceptable) + nodeName, err = s.trySchedule(similarPods, clusterSnapshot, pod, loggingQuota, isNodeAcceptable) + if err != nil { + return nil, 0, err + } } if nodeName != "" { klogx.V(4).UpTo(loggingQuota).Infof("Pod %s/%s can be moved to %s", pod.Namespace, pod.Name, nodeName) - if err := clusterSnapshot.ForceAddPod(pod, nodeName); err != nil { - return nil, 0, fmt.Errorf("simulating scheduling of %s/%s to %s return error; %v", pod.Namespace, pod.Name, nodeName, err) - } statuses = append(statuses, Status{Pod: pod, NodeName: nodeName}) } else if breakOnFailure { break @@ -85,40 +80,45 @@ func (s *HintingSimulator) TrySchedulePods(clusterSnapshot clustersnapshot.Clust return statuses, similarPods.OverflowingControllerCount(), nil } -func (s *HintingSimulator) findNodeWithHints(clusterSnapshot clustersnapshot.ClusterSnapshot, pod *apiv1.Pod, isNodeAcceptable func(*framework.NodeInfo) bool) (string, error) { +func (s *HintingSimulator) tryScheduleUsingHints(clusterSnapshot clustersnapshot.ClusterSnapshot, pod *apiv1.Pod, isNodeAcceptable func(*framework.NodeInfo) bool) (string, error) { hk := HintKeyFromPod(pod) if hintedNode, hasHint := s.hints.Get(hk); hasHint { - 
if err := s.predicateChecker.CheckPredicates(clusterSnapshot, pod, hintedNode); err == nil { + nodeInfo, err := clusterSnapshot.GetNodeInfo(hintedNode) + if err != nil { + return "", err + } + if !isNodeAcceptable(nodeInfo) { + return "", nil + } + if err := clusterSnapshot.SchedulePod(pod, hintedNode); err == nil { s.hints.Set(hk, hintedNode) - - nodeInfo, err := clusterSnapshot.GetNodeInfo(hintedNode) - if err != nil { - return "", err - } - - if isNodeAcceptable(nodeInfo) { - return hintedNode, nil - } + return hintedNode, nil + } else if err != nil && err.Type() != clustersnapshot.FailingPredicateError { + // Unexpected error. + return "", err } } return "", nil } -func (s *HintingSimulator) findNode(similarPods *SimilarPodsScheduling, clusterSnapshot clustersnapshot.ClusterSnapshot, pod *apiv1.Pod, loggingQuota *klogx.Quota, isNodeAcceptable func(*framework.NodeInfo) bool) string { +func (s *HintingSimulator) trySchedule(similarPods *SimilarPodsScheduling, clusterSnapshot clustersnapshot.ClusterSnapshot, pod *apiv1.Pod, loggingQuota *klogx.Quota, isNodeAcceptable func(*framework.NodeInfo) bool) (string, error) { if similarPods.IsSimilarUnschedulable(pod) { klogx.V(4).UpTo(loggingQuota).Infof("failed to find place for %s/%s based on similar pods scheduling", pod.Namespace, pod.Name) - return "" + return "", nil } - newNodeName, err := s.predicateChecker.FitsAnyNodeMatching(clusterSnapshot, pod, isNodeAcceptable) - if err != nil { + newNodeName, err := clusterSnapshot.SchedulePodOnAnyNodeMatching(pod, isNodeAcceptable) + if err != nil && err.Type() == clustersnapshot.NoNodesPassingPredicatesFoundError { klogx.V(4).UpTo(loggingQuota).Infof("failed to find place for %s/%s: %v", pod.Namespace, pod.Name, err) similarPods.SetUnschedulable(pod) - return "" + return "", nil + } else if err != nil { + // Unexpected error. 
+ return "", err } s.hints.Set(HintKeyFromPod(pod), newNodeName) - return newNodeName + return newNodeName, nil } // DropOldHints drops old scheduling hints. diff --git a/cluster-autoscaler/simulator/scheduling/hinting_simulator_test.go b/cluster-autoscaler/simulator/scheduling/hinting_simulator_test.go index 7e3ec8cb3d11..d4b86d256862 100644 --- a/cluster-autoscaler/simulator/scheduling/hinting_simulator_test.go +++ b/cluster-autoscaler/simulator/scheduling/hinting_simulator_test.go @@ -20,19 +20,16 @@ import ( "testing" "time" + "github.com/stretchr/testify/assert" + + apiv1 "k8s.io/api/core/v1" "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot" + "k8s.io/autoscaler/cluster-autoscaler/simulator/clustersnapshot/testsnapshot" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" - "k8s.io/autoscaler/cluster-autoscaler/simulator/predicatechecker" . "k8s.io/autoscaler/cluster-autoscaler/utils/test" - schedulermetrics "k8s.io/kubernetes/pkg/scheduler/metrics" - - "github.com/stretchr/testify/assert" - apiv1 "k8s.io/api/core/v1" ) func TestTrySchedulePods(t *testing.T) { - schedulermetrics.Register() - testCases := []struct { desc string nodes []*apiv1.Node @@ -136,11 +133,9 @@ func TestTrySchedulePods(t *testing.T) { tc := tc t.Run(tc.desc, func(t *testing.T) { t.Parallel() - clusterSnapshot := clustersnapshot.NewBasicClusterSnapshot() - predicateChecker, err := predicatechecker.NewTestPredicateChecker() - assert.NoError(t, err) + clusterSnapshot := testsnapshot.NewTestSnapshotOrDie(t) clustersnapshot.InitializeClusterSnapshotOrDie(t, clusterSnapshot, tc.nodes, tc.pods) - s := NewHintingSimulator(predicateChecker) + s := NewHintingSimulator() statuses, _, err := s.TrySchedulePods(clusterSnapshot, tc.newPods, tc.acceptableNodes, false) if tc.wantErr { assert.Error(t, err) @@ -213,16 +208,14 @@ func TestPodSchedulesOnHintedNode(t *testing.T) { tc := tc t.Run(tc.desc, func(t *testing.T) { t.Parallel() - clusterSnapshot := 
clustersnapshot.NewBasicClusterSnapshot() - predicateChecker, err := predicatechecker.NewTestPredicateChecker() - assert.NoError(t, err) + clusterSnapshot := testsnapshot.NewTestSnapshotOrDie(t) nodes := make([]*apiv1.Node, 0, len(tc.nodeNames)) for _, n := range tc.nodeNames { nodes = append(nodes, buildReadyNode(n, 9999, 9999)) } clustersnapshot.InitializeClusterSnapshotOrDie(t, clusterSnapshot, nodes, []*apiv1.Pod{}) pods := make([]*apiv1.Pod, 0, len(tc.podNodes)) - s := NewHintingSimulator(predicateChecker) + s := NewHintingSimulator() var expectedStatuses []Status for p, n := range tc.podNodes { pod := BuildTestPod(p, 1, 1) diff --git a/cluster-autoscaler/utils/daemonset/daemonset.go b/cluster-autoscaler/utils/daemonset/daemonset.go index 06236ae2443c..dbeab83ad96b 100644 --- a/cluster-autoscaler/utils/daemonset/daemonset.go +++ b/cluster-autoscaler/utils/daemonset/daemonset.go @@ -22,6 +22,7 @@ import ( appsv1 "k8s.io/api/apps/v1" apiv1 "k8s.io/api/core/v1" + metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" "k8s.io/kubernetes/pkg/controller/daemon" ) @@ -40,6 +41,10 @@ func GetDaemonSetPodsForNode(nodeInfo *framework.NodeInfo, daemonsets []*appsv1. 
if shouldRun { pod := daemon.NewPod(ds, nodeInfo.Node().Name) pod.Name = fmt.Sprintf("%s-pod-%d", ds.Name, rand.Int63()) + ptrVal := true + pod.ObjectMeta.OwnerReferences = []metav1.OwnerReference{ + {Kind: "DaemonSet", UID: ds.UID, Name: ds.Name, Controller: &ptrVal}, + } result = append(result, &framework.PodInfo{Pod: pod}) } } diff --git a/cluster-autoscaler/utils/scheduler/scheduler.go b/cluster-autoscaler/utils/scheduler/scheduler.go index 04a6e99e7af7..c63da3cbf437 100644 --- a/cluster-autoscaler/utils/scheduler/scheduler.go +++ b/cluster-autoscaler/utils/scheduler/scheduler.go @@ -23,7 +23,6 @@ import ( apiv1 "k8s.io/api/core/v1" "k8s.io/apimachinery/pkg/api/resource" - "k8s.io/apimachinery/pkg/util/uuid" "k8s.io/autoscaler/cluster-autoscaler/simulator/framework" scheduler_config "k8s.io/kubernetes/pkg/scheduler/apis/config" scheduler_scheme "k8s.io/kubernetes/pkg/scheduler/apis/config/scheme" @@ -79,27 +78,6 @@ func isHugePageResourceName(name apiv1.ResourceName) bool { return strings.HasPrefix(string(name), apiv1.ResourceHugePagesPrefix) } -// DeepCopyTemplateNode copies NodeInfo object used as a template. It changes -// names of UIDs of both node and pods running on it, so that copies can be used -// to represent multiple nodes. -func DeepCopyTemplateNode(nodeTemplate *framework.NodeInfo, suffix string) *framework.NodeInfo { - node := nodeTemplate.Node().DeepCopy() - node.Name = fmt.Sprintf("%s-%s", node.Name, suffix) - node.UID = uuid.NewUUID() - if node.Labels == nil { - node.Labels = make(map[string]string) - } - node.Labels["kubernetes.io/hostname"] = node.Name - nodeInfo := framework.NewNodeInfo(node, nil) - for _, podInfo := range nodeTemplate.Pods() { - pod := podInfo.Pod.DeepCopy() - pod.Name = fmt.Sprintf("%s-%s", podInfo.Pod.Name, suffix) - pod.UID = uuid.NewUUID() - nodeInfo.AddPod(&framework.PodInfo{Pod: pod}) - } - return nodeInfo -} - // ResourceToResourceList returns a resource list of the resource. 
func ResourceToResourceList(r *schedulerframework.Resource) apiv1.ResourceList { result := apiv1.ResourceList{