Merge pull request #86496 from ahg-g/ahg1-check

Support AlwaysCheckAllPredicates in the scheduler framework.
Kubernetes Prow Robot 2019-12-23 09:53:33 -08:00 committed by GitHub
commit 06fb3eb582
5 changed files with 109 additions and 34 deletions

View File

@@ -89,6 +89,9 @@ type Configurator struct {
     // Disable pod preemption or not.
     disablePreemption bool
+    // Always check all predicates, even if one of them fails along the way.
+    alwaysCheckAllPredicates bool
     // percentageOfNodesToScore specifies percentage of all nodes to score in each scheduling cycle.
     percentageOfNodesToScore int32
@@ -202,6 +205,11 @@ func (c *Configurator) CreateFromConfig(policy schedulerapi.Policy) (*Scheduler,
         c.hardPodAffinitySymmetricWeight = policy.HardPodAffinitySymmetricWeight
     }
+    // When AlwaysCheckAllPredicates is set to true, the scheduler checks all the
+    // configured predicates even after one or more of them fails.
+    if policy.AlwaysCheckAllPredicates {
+        c.alwaysCheckAllPredicates = policy.AlwaysCheckAllPredicates
+    }
     return c.CreateFromKeys(predicateKeys, priorityKeys, extenders)
 }
@@ -250,6 +258,7 @@ func (c *Configurator) CreateFromKeys(predicateKeys, priorityKeys sets.String, e
         framework.WithClientSet(c.client),
         framework.WithInformerFactory(c.informerFactory),
         framework.WithSnapshotSharedLister(c.nodeInfoSnapshot),
+        framework.WithRunAllFilters(c.alwaysCheckAllPredicates),
     )
     if err != nil {
         klog.Fatalf("error initializing the scheduling framework: %v", err)
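Taken together, this file's changes plumb the Policy's existing AlwaysCheckAllPredicates field through the Configurator and into the framework via the new WithRunAllFilters option (defined in the next file). A minimal, self-contained sketch of that plumbing with toy types — the real Policy and Configurator carry many more fields, and the lowercase method names here are hypothetical stand-ins:

package main

import "fmt"

// Toy stand-ins; only the one field this PR cares about is modeled.
type Policy struct{ AlwaysCheckAllPredicates bool }

type Configurator struct{ alwaysCheckAllPredicates bool }

// createFromConfig mirrors CreateFromConfig above: lift the flag off the
// Policy and store it on the Configurator.
func (c *Configurator) createFromConfig(policy Policy) {
	if policy.AlwaysCheckAllPredicates {
		c.alwaysCheckAllPredicates = policy.AlwaysCheckAllPredicates
	}
}

// createFromKeys mirrors CreateFromKeys above: forward the stored flag to the
// framework constructor (there it becomes framework.WithRunAllFilters(...)).
func (c *Configurator) createFromKeys() bool {
	return c.alwaysCheckAllPredicates
}

func main() {
	c := &Configurator{}
	c.createFromConfig(Policy{AlwaysCheckAllPredicates: true})
	fmt.Println(c.createFromKeys()) // true
}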

View File

@@ -78,6 +78,10 @@ type framework struct {
     informerFactory informers.SharedInformerFactory
     metricsRecorder *metricsRecorder
+    // Indicates that RunFilterPlugins should accumulate all failed statuses and not return
+    // after the first failure.
+    runAllFilters bool
 }

 // extensionPoint encapsulates desired and applied set of plugins at a specific extension
@@ -112,6 +116,7 @@ type frameworkOptions struct {
     informerFactory informers.SharedInformerFactory
     snapshotSharedLister schedulerlisters.SharedLister
     metricsRecorder *metricsRecorder
+    runAllFilters bool
 }

 // Option for the framework.
@@ -138,6 +143,14 @@ func WithSnapshotSharedLister(snapshotSharedLister schedulerlisters.SharedLister
     }
 }

+// WithRunAllFilters sets the runAllFilters flag, which means RunFilterPlugins accumulates
+// all failure Statuses.
+func WithRunAllFilters(runAllFilters bool) Option {
+    return func(o *frameworkOptions) {
+        o.runAllFilters = runAllFilters
+    }
+}
+
 // withMetricsRecorder is only used in tests.
 func withMetricsRecorder(recorder *metricsRecorder) Option {
     return func(o *frameworkOptions) {
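WithRunAllFilters follows the same functional-options pattern as the neighboring With* helpers: each option is a closure that mutates a frameworkOptions struct before construction. A self-contained sketch of the pattern with toy types (the real frameworkOptions carries several more fields):

package main

import "fmt"

// Toy versions of frameworkOptions and Option.
type frameworkOptions struct {
	runAllFilters bool
}

type Option func(*frameworkOptions)

// WithRunAllFilters mirrors the helper added in this PR.
func WithRunAllFilters(runAllFilters bool) Option {
	return func(o *frameworkOptions) {
		o.runAllFilters = runAllFilters
	}
}

// newFramework applies each option to a defaults struct, the same shape
// NewFramework above uses.
func newFramework(opts ...Option) *frameworkOptions {
	options := &frameworkOptions{} // defaults: runAllFilters is false
	for _, opt := range opts {
		opt(options)
	}
	return options
}

func main() {
	f := newFramework(WithRunAllFilters(true))
	fmt.Println(f.runAllFilters) // true
}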
@@ -166,6 +179,7 @@ func NewFramework(r Registry, plugins *config.Plugins, args []config.PluginConfi
         clientSet: options.clientSet,
         informerFactory: options.informerFactory,
         metricsRecorder: options.metricsRecorder,
+        runAllFilters: options.runAllFilters,
     }
     if plugins == nil {
         return f, nil
@@ -395,27 +409,37 @@ func (f *framework) RunFilterPlugins(
     state *CycleState,
     pod *v1.Pod,
     nodeInfo *schedulernodeinfo.NodeInfo,
-) (status *Status) {
+) (finalStatus *Status) {
     if state.ShouldRecordFrameworkMetrics() {
         startTime := time.Now()
         defer func() {
-            f.metricsRecorder.observeExtensionPointDurationAsync(filter, status, metrics.SinceInSeconds(startTime))
+            f.metricsRecorder.observeExtensionPointDurationAsync(filter, finalStatus, metrics.SinceInSeconds(startTime))
         }()
     }
     for _, pl := range f.filterPlugins {
-        status = f.runFilterPlugin(ctx, pl, state, pod, nodeInfo)
-        if !status.IsSuccess() {
-            if !status.IsUnschedulable() {
-                errMsg := fmt.Sprintf("error while running %q filter plugin for pod %q: %v",
-                    pl.Name(), pod.Name, status.Message())
-                klog.Error(errMsg)
-                return NewStatus(Error, errMsg)
+        pluginStatus := f.runFilterPlugin(ctx, pl, state, pod, nodeInfo)
+        if !pluginStatus.IsSuccess() {
+            if !pluginStatus.IsUnschedulable() {
+                // Filter plugins are not supposed to return any status other than
+                // Success or Unschedulable.
+                return NewStatus(Error, fmt.Sprintf("running %q filter plugin for pod %q: %v", pl.Name(), pod.Name, pluginStatus.Message()))
             }
-            return status
+            if !f.runAllFilters {
+                // Exit early if we don't need to run all filters.
+                return pluginStatus
+            }
+            // We need to continue and run all filters.
+            if finalStatus.IsSuccess() {
+                // This is the first failed plugin.
+                finalStatus = pluginStatus
+                continue
+            }
+            // We get here only if more than one Filter returns unschedulable and runAllFilters is true.
+            finalStatus.reasons = append(finalStatus.reasons, pluginStatus.reasons...)
         }
     }
-    return nil
+    return finalStatus
 }

 func (f *framework) runFilterPlugin(ctx context.Context, pl FilterPlugin, state *CycleState, pod *v1.Pod, nodeInfo *schedulernodeinfo.NodeInfo) *Status {
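The rewritten loop has two modes. By default it still returns on the first failing filter; with runAllFilters set it keeps evaluating, keeps the code of the first failure, and appends every later failure's reasons to it. Either way, a status that is neither Success nor Unschedulable aborts immediately with an Error. A self-contained sketch of just that control flow, with a trimmed-down Status type standing in for the framework's:

package main

import "fmt"

type Code int

const (
	Success Code = iota
	Unschedulable
	UnschedulableAndUnresolvable
	Error
)

// Status is a toy stand-in for the framework's Status type.
type Status struct {
	code    Code
	reasons []string
}

// IsSuccess treats a nil status as success, like the real framework does.
func (s *Status) IsSuccess() bool { return s == nil || s.code == Success }

// runFilters mirrors the control flow of RunFilterPlugins above: exit on the
// first failure, or, when runAll is set, fold every later failure's reasons
// into the first failed status (whose code is kept).
func runFilters(runAll bool, statuses ...*Status) *Status {
	var final *Status
	for _, s := range statuses {
		if s.IsSuccess() {
			continue
		}
		if !runAll {
			return s // exit early on the first failure
		}
		if final.IsSuccess() {
			final = s // first failure: keep its code and reasons
			continue
		}
		final.reasons = append(final.reasons, s.reasons...)
	}
	return final
}

func main() {
	a := &Status{code: UnschedulableAndUnresolvable, reasons: []string{"node(s) had taints"}}
	b := &Status{code: Unschedulable, reasons: []string{"insufficient cpu"}}

	fmt.Println(runFilters(false, a, b).reasons) // [node(s) had taints]
	fmt.Println(runFilters(true, a, b).reasons)  // [node(s) had taints insufficient cpu]
}

This is exactly the behavior the new two-unschedulable-plugins test case below asserts: the first failure's code wins and both reasons are reported.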

View File

@@ -165,7 +165,7 @@ func (pl *TestPlugin) PreFilterExtensions() PreFilterExtensions {
 }

 func (pl *TestPlugin) Filter(ctx context.Context, state *CycleState, pod *v1.Pod, nodeInfo *schedulernodeinfo.NodeInfo) *Status {
-    return NewStatus(Code(pl.inj.FilterStatus), "injected status")
+    return NewStatus(Code(pl.inj.FilterStatus), "injected filter status")
 }

 func (pl *TestPlugin) PostFilter(ctx context.Context, state *CycleState, pod *v1.Pod, nodes []*v1.Node, filteredNodesStatuses NodeToStatusMap) *Status {
@@ -600,7 +600,8 @@ func TestFilterPlugins(t *testing.T) {
     tests := []struct {
         name string
         plugins []*TestPlugin
-        wantCode Code
+        wantStatus *Status
+        runAllFilters bool
     }{
         {
             name: "SuccessFilter",
@@ -610,7 +611,7 @@
                     inj: injectedResult{FilterStatus: int(Success)},
                 },
             },
-            wantCode: Success,
+            wantStatus: nil,
         },
         {
             name: "ErrorFilter",
@@ -620,7 +621,7 @@
                     inj: injectedResult{FilterStatus: int(Error)},
                 },
             },
-            wantCode: Error,
+            wantStatus: NewStatus(Error, `running "TestPlugin" filter plugin for pod "": injected filter status`),
         },
         {
             name: "UnschedulableFilter",
@@ -630,7 +631,7 @@
                     inj: injectedResult{FilterStatus: int(Unschedulable)},
                 },
             },
-            wantCode: Unschedulable,
+            wantStatus: NewStatus(Unschedulable, "injected filter status"),
         },
         {
             name: "UnschedulableAndUnresolvableFilter",
@@ -641,7 +642,7 @@
                         FilterStatus: int(UnschedulableAndUnresolvable)},
                 },
             },
-            wantCode: UnschedulableAndUnresolvable,
+            wantStatus: NewStatus(UnschedulableAndUnresolvable, "injected filter status"),
         },
         // The following tests cover multiple-plugin scenarios.
         {
@@ -657,7 +658,7 @@
                     inj: injectedResult{FilterStatus: int(Error)},
                 },
             },
-            wantCode: Error,
+            wantStatus: NewStatus(Error, `running "TestPlugin1" filter plugin for pod "": injected filter status`),
         },
         {
             name: "SuccessAndSuccessFilters",
@@ -672,7 +673,7 @@
                     inj: injectedResult{FilterStatus: int(Success)},
                 },
             },
-            wantCode: Success,
+            wantStatus: nil,
         },
         {
             name: "ErrorAndSuccessFilters",
@@ -686,7 +687,7 @@
                     inj: injectedResult{FilterStatus: int(Success)},
                 },
             },
-            wantCode: Error,
+            wantStatus: NewStatus(Error, `running "TestPlugin1" filter plugin for pod "": injected filter status`),
         },
         {
             name: "SuccessAndErrorFilters",
@@ -701,7 +702,7 @@
                     inj: injectedResult{FilterStatus: int(Error)},
                 },
             },
-            wantCode: Error,
+            wantStatus: NewStatus(Error, `running "TestPlugin2" filter plugin for pod "": injected filter status`),
         },
         {
             name: "SuccessAndUnschedulableFilters",
@@ -716,7 +717,50 @@
                     inj: injectedResult{FilterStatus: int(Unschedulable)},
                 },
             },
-            wantCode: Unschedulable,
+            wantStatus: NewStatus(Unschedulable, "injected filter status"),
+        },
+        {
+            name: "SuccessFilterWithRunAllFilters",
+            plugins: []*TestPlugin{
+                {
+                    name: "TestPlugin",
+                    inj: injectedResult{FilterStatus: int(Success)},
+                },
+            },
+            runAllFilters: true,
+            wantStatus: nil,
+        },
+        {
+            name: "ErrorAndErrorFilters",
+            plugins: []*TestPlugin{
+                {
+                    name: "TestPlugin1",
+                    inj: injectedResult{FilterStatus: int(Error)},
+                },
+                {
+                    name: "TestPlugin2",
+                    inj: injectedResult{FilterStatus: int(Error)},
+                },
+            },
+            runAllFilters: true,
+            wantStatus: NewStatus(Error, `running "TestPlugin1" filter plugin for pod "": injected filter status`),
+        },
+        {
+            name: "UnschedulableAndUnschedulableFilters",
+            plugins: []*TestPlugin{
+                {
+                    name: "TestPlugin1",
+                    inj: injectedResult{FilterStatus: int(UnschedulableAndUnresolvable)},
+                },
+                {
+                    name: "TestPlugin2",
+                    inj: injectedResult{FilterStatus: int(Unschedulable)},
+                },
+            },
+            runAllFilters: true,
+            wantStatus: NewStatus(UnschedulableAndUnresolvable, "injected filter status", "injected filter status"),
         },
     }
@@ -739,13 +783,13 @@
                 config.Plugin{Name: pl.name})
         }

-        f, err := NewFramework(registry, cfgPls, emptyArgs)
+        f, err := NewFramework(registry, cfgPls, emptyArgs, WithRunAllFilters(tt.runAllFilters))
         if err != nil {
             t.Fatalf("fail to create framework: %s", err)
         }

         status := f.RunFilterPlugins(context.TODO(), nil, pod, nil)
-        if status.Code() != tt.wantCode {
-            t.Errorf("Wrong status code. got: %v, want:%v", status.Code(), tt.wantCode)
+        if !reflect.DeepEqual(status, tt.wantStatus) {
+            t.Errorf("Wrong status. got: %v, want: %v", status, tt.wantStatus)
         }
     })
 }
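One consequential detail in the test changes above: the assertion now compares the whole *Status with reflect.DeepEqual rather than just the code, because with reason accumulation two statuses can share a code yet carry different reasons. A toy illustration of the difference (simplified status type, not the framework's):

package main

import (
	"fmt"
	"reflect"
)

// Toy status: the same shape of comparison the test now performs.
type status struct {
	code    int
	reasons []string
}

func main() {
	got := &status{code: 2, reasons: []string{"injected filter status", "injected filter status"}}
	want := &status{code: 2, reasons: []string{"injected filter status"}}

	// Comparing only the code would pass; DeepEqual also checks the
	// accumulated reasons and catches the difference.
	fmt.Println(got.code == want.code)        // true
	fmt.Println(reflect.DeepEqual(got, want)) // false
}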

View File

@@ -384,12 +384,10 @@ type Framework interface {
     RunPreFilterPlugins(ctx context.Context, state *CycleState, pod *v1.Pod) *Status
     // RunFilterPlugins runs the set of configured filter plugins for pod on
-    // the given node. It returns directly if any of the filter plugins
-    // return any status other than "Success". Note that for the node being
-    // evaluated, the passed nodeInfo reference could be different from the
-    // one in NodeInfoSnapshot map (e.g., pods considered to be running on
-    // the node could be different). For example, during preemption, we may
-    // pass a copy of the original nodeInfo object that has some pods
+    // the given node. Note that for the node being evaluated, the passed nodeInfo
+    // reference could be different from the one in NodeInfoSnapshot map (e.g., pods
+    // considered to be running on the node could be different). For example, during
+    // preemption, we may pass a copy of the original nodeInfo object that has some pods
     // removed from it to evaluate the possibility of preempting them to
     // schedule the target pod.
     RunFilterPlugins(ctx context.Context, state *CycleState, pod *v1.Pod, nodeInfo *schedulernodeinfo.NodeInfo) *Status
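The sentence deleted above ("returns directly if any filter returns a status other than Success") is dropped because it no longer always holds: with runAllFilters the framework may keep evaluating. The contract for individual plugins is unchanged, though: return nil (Success), an Unschedulable-flavored status with human-readable reasons, or any other status to signal an internal error. A toy plugin against a simplified interface — not the real framework API, which also passes a context, a CycleState, the Pod, and a NodeInfo:

package main

import "fmt"

type Code int

const (
	Success Code = iota
	Unschedulable
	Error
)

type Status struct {
	code    Code
	reasons []string
}

// FilterPlugin is a heavily simplified version of the framework's interface.
type FilterPlugin interface {
	Name() string
	Filter(nodeName string) *Status
}

// nodeNamePlugin rejects every node except the one it was built with.
type nodeNamePlugin struct{ want string }

func (p *nodeNamePlugin) Name() string { return "ToyNodeName" }

func (p *nodeNamePlugin) Filter(nodeName string) *Status {
	if nodeName == p.want {
		return nil // nil means Success, as in the real framework
	}
	// Unschedulable, never Error, for ordinary "this node doesn't fit" cases.
	return &Status{code: Unschedulable, reasons: []string{"node name mismatch"}}
}

func main() {
	var pl FilterPlugin = &nodeNamePlugin{want: "node-a"}
	fmt.Println(pl.Filter("node-a"))         // <nil>
	fmt.Println(pl.Filter("node-b").reasons) // [node name mismatch]
}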

View File

@@ -890,7 +890,7 @@ func TestSchedulerWithVolumeBinding(t *testing.T) {
                 FindErr: findErr,
             },
             eventReason: "FailedScheduling",
-            expectError: fmt.Errorf("error while running %q filter plugin for pod %q: %v", volumebinding.Name, "foo", findErr),
+            expectError: fmt.Errorf("running %q filter plugin for pod %q: %v", volumebinding.Name, "foo", findErr),
         },
         {
             name: "assume error",