1
16
17 package nodeaffinity
18
19 import (
20 "context"
21 "fmt"
22
23 v1 "k8s.io/api/core/v1"
24 metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
25 "k8s.io/apimachinery/pkg/runtime"
26 "k8s.io/apimachinery/pkg/util/sets"
27 "k8s.io/component-helpers/scheduling/corev1/nodeaffinity"
28 "k8s.io/klog/v2"
29 "k8s.io/kubernetes/pkg/scheduler/apis/config"
30 "k8s.io/kubernetes/pkg/scheduler/apis/config/validation"
31 "k8s.io/kubernetes/pkg/scheduler/framework"
32 "k8s.io/kubernetes/pkg/scheduler/framework/plugins/helper"
33 "k8s.io/kubernetes/pkg/scheduler/framework/plugins/names"
34 "k8s.io/kubernetes/pkg/scheduler/util"
35 )
36
37
38 type NodeAffinity struct {
39 handle framework.Handle
40 addedNodeSelector *nodeaffinity.NodeSelector
41 addedPrefSchedTerms *nodeaffinity.PreferredSchedulingTerms
42 }
43
44 var _ framework.PreFilterPlugin = &NodeAffinity{}
45 var _ framework.FilterPlugin = &NodeAffinity{}
46 var _ framework.PreScorePlugin = &NodeAffinity{}
47 var _ framework.ScorePlugin = &NodeAffinity{}
48 var _ framework.EnqueueExtensions = &NodeAffinity{}
49
50 const (
51
52 Name = names.NodeAffinity
53
54
55 preScoreStateKey = "PreScore" + Name
56
57
58 preFilterStateKey = "PreFilter" + Name
59
60
61 ErrReasonPod = "node(s) didn't match Pod's node affinity/selector"
62
63
64 errReasonEnforced = "node(s) didn't match scheduler-enforced node affinity"
65
66
67 errReasonConflict = "pod affinity terms conflict"
68 )
69
70
71 func (pl *NodeAffinity) Name() string {
72 return Name
73 }
74
75 type preFilterState struct {
76 requiredNodeSelectorAndAffinity nodeaffinity.RequiredNodeAffinity
77 }
78
79
80 func (s *preFilterState) Clone() framework.StateData {
81 return s
82 }
83
84
85
86 func (pl *NodeAffinity) EventsToRegister() []framework.ClusterEventWithHint {
87 return []framework.ClusterEventWithHint{
88 {Event: framework.ClusterEvent{Resource: framework.Node, ActionType: framework.Add | framework.Update}, QueueingHintFn: pl.isSchedulableAfterNodeChange},
89 }
90 }
91
92
93
94 func (pl *NodeAffinity) isSchedulableAfterNodeChange(logger klog.Logger, pod *v1.Pod, oldObj, newObj interface{}) (framework.QueueingHint, error) {
95 _, modifiedNode, err := util.As[*v1.Node](oldObj, newObj)
96 if err != nil {
97 return framework.Queue, err
98 }
99
100 if pl.addedNodeSelector != nil && !pl.addedNodeSelector.Match(modifiedNode) {
101 logger.V(4).Info("added or modified node didn't match scheduler-enforced node affinity and this event won't make the Pod schedulable", "pod", klog.KObj(pod), "node", klog.KObj(modifiedNode))
102 return framework.QueueSkip, nil
103 }
104
105 requiredNodeAffinity := nodeaffinity.GetRequiredNodeAffinity(pod)
106 isMatched, err := requiredNodeAffinity.Match(modifiedNode)
107 if err != nil {
108 return framework.Queue, err
109 }
110 if isMatched {
111 logger.V(4).Info("node was created or updated, and matches with the pod's NodeAffinity", "pod", klog.KObj(pod), "node", klog.KObj(modifiedNode))
112 return framework.Queue, nil
113 }
114
115
116
117
118 logger.V(4).Info("node was created or updated, but it doesn't make this pod schedulable", "pod", klog.KObj(pod), "node", klog.KObj(modifiedNode))
119 return framework.QueueSkip, nil
120 }
121
122
123 func (pl *NodeAffinity) PreFilter(ctx context.Context, cycleState *framework.CycleState, pod *v1.Pod) (*framework.PreFilterResult, *framework.Status) {
124 affinity := pod.Spec.Affinity
125 noNodeAffinity := (affinity == nil ||
126 affinity.NodeAffinity == nil ||
127 affinity.NodeAffinity.RequiredDuringSchedulingIgnoredDuringExecution == nil)
128 if noNodeAffinity && pl.addedNodeSelector == nil && pod.Spec.NodeSelector == nil {
129
130 return nil, framework.NewStatus(framework.Skip)
131 }
132
133 state := &preFilterState{requiredNodeSelectorAndAffinity: nodeaffinity.GetRequiredNodeAffinity(pod)}
134 cycleState.Write(preFilterStateKey, state)
135
136 if noNodeAffinity || len(affinity.NodeAffinity.RequiredDuringSchedulingIgnoredDuringExecution.NodeSelectorTerms) == 0 {
137 return nil, nil
138 }
139
140
141 terms := affinity.NodeAffinity.RequiredDuringSchedulingIgnoredDuringExecution.NodeSelectorTerms
142 var nodeNames sets.Set[string]
143 for _, t := range terms {
144 var termNodeNames sets.Set[string]
145 for _, r := range t.MatchFields {
146 if r.Key == metav1.ObjectNameField && r.Operator == v1.NodeSelectorOpIn {
147
148
149 s := sets.New(r.Values...)
150 if termNodeNames == nil {
151 termNodeNames = s
152 } else {
153 termNodeNames = termNodeNames.Intersection(s)
154 }
155 }
156 }
157 if termNodeNames == nil {
158
159
160 return nil, nil
161 }
162 nodeNames = nodeNames.Union(termNodeNames)
163 }
164
165
166 if nodeNames != nil && len(nodeNames) == 0 {
167 return nil, framework.NewStatus(framework.UnschedulableAndUnresolvable, errReasonConflict)
168 } else if len(nodeNames) > 0 {
169 return &framework.PreFilterResult{NodeNames: nodeNames}, nil
170 }
171 return nil, nil
172
173 }
174
175
176 func (pl *NodeAffinity) PreFilterExtensions() framework.PreFilterExtensions {
177 return nil
178 }
179
180
181
182 func (pl *NodeAffinity) Filter(ctx context.Context, state *framework.CycleState, pod *v1.Pod, nodeInfo *framework.NodeInfo) *framework.Status {
183 node := nodeInfo.Node()
184
185 if pl.addedNodeSelector != nil && !pl.addedNodeSelector.Match(node) {
186 return framework.NewStatus(framework.UnschedulableAndUnresolvable, errReasonEnforced)
187 }
188
189 s, err := getPreFilterState(state)
190 if err != nil {
191
192
193 s = &preFilterState{requiredNodeSelectorAndAffinity: nodeaffinity.GetRequiredNodeAffinity(pod)}
194 }
195
196
197 match, _ := s.requiredNodeSelectorAndAffinity.Match(node)
198 if !match {
199 return framework.NewStatus(framework.UnschedulableAndUnresolvable, ErrReasonPod)
200 }
201
202 return nil
203 }
204
205
206 type preScoreState struct {
207 preferredNodeAffinity *nodeaffinity.PreferredSchedulingTerms
208 }
209
210
211
212 func (s *preScoreState) Clone() framework.StateData {
213 return s
214 }
215
216
217 func (pl *NodeAffinity) PreScore(ctx context.Context, cycleState *framework.CycleState, pod *v1.Pod, nodes []*framework.NodeInfo) *framework.Status {
218 if len(nodes) == 0 {
219 return nil
220 }
221 preferredNodeAffinity, err := getPodPreferredNodeAffinity(pod)
222 if err != nil {
223 return framework.AsStatus(err)
224 }
225 if preferredNodeAffinity == nil && pl.addedPrefSchedTerms == nil {
226
227 return framework.NewStatus(framework.Skip)
228 }
229 state := &preScoreState{
230 preferredNodeAffinity: preferredNodeAffinity,
231 }
232 cycleState.Write(preScoreStateKey, state)
233 return nil
234 }
235
236
237
238
239 func (pl *NodeAffinity) Score(ctx context.Context, state *framework.CycleState, pod *v1.Pod, nodeName string) (int64, *framework.Status) {
240 nodeInfo, err := pl.handle.SnapshotSharedLister().NodeInfos().Get(nodeName)
241 if err != nil {
242 return 0, framework.AsStatus(fmt.Errorf("getting node %q from Snapshot: %w", nodeName, err))
243 }
244
245 node := nodeInfo.Node()
246
247 var count int64
248 if pl.addedPrefSchedTerms != nil {
249 count += pl.addedPrefSchedTerms.Score(node)
250 }
251
252 s, err := getPreScoreState(state)
253 if err != nil {
254
255 preferredNodeAffinity, err := getPodPreferredNodeAffinity(pod)
256 if err != nil {
257 return 0, framework.AsStatus(err)
258 }
259 s = &preScoreState{
260 preferredNodeAffinity: preferredNodeAffinity,
261 }
262 }
263
264 if s.preferredNodeAffinity != nil {
265 count += s.preferredNodeAffinity.Score(node)
266 }
267
268 return count, nil
269 }
270
271
272 func (pl *NodeAffinity) NormalizeScore(ctx context.Context, state *framework.CycleState, pod *v1.Pod, scores framework.NodeScoreList) *framework.Status {
273 return helper.DefaultNormalizeScore(framework.MaxNodeScore, false, scores)
274 }
275
276
277 func (pl *NodeAffinity) ScoreExtensions() framework.ScoreExtensions {
278 return pl
279 }
280
281
282 func New(_ context.Context, plArgs runtime.Object, h framework.Handle) (framework.Plugin, error) {
283 args, err := getArgs(plArgs)
284 if err != nil {
285 return nil, err
286 }
287 pl := &NodeAffinity{
288 handle: h,
289 }
290 if args.AddedAffinity != nil {
291 if ns := args.AddedAffinity.RequiredDuringSchedulingIgnoredDuringExecution; ns != nil {
292 pl.addedNodeSelector, err = nodeaffinity.NewNodeSelector(ns)
293 if err != nil {
294 return nil, fmt.Errorf("parsing addedAffinity.requiredDuringSchedulingIgnoredDuringExecution: %w", err)
295 }
296 }
297
298 if terms := args.AddedAffinity.PreferredDuringSchedulingIgnoredDuringExecution; len(terms) != 0 {
299 pl.addedPrefSchedTerms, err = nodeaffinity.NewPreferredSchedulingTerms(terms)
300 if err != nil {
301 return nil, fmt.Errorf("parsing addedAffinity.preferredDuringSchedulingIgnoredDuringExecution: %w", err)
302 }
303 }
304 }
305 return pl, nil
306 }
307
308 func getArgs(obj runtime.Object) (config.NodeAffinityArgs, error) {
309 ptr, ok := obj.(*config.NodeAffinityArgs)
310 if !ok {
311 return config.NodeAffinityArgs{}, fmt.Errorf("args are not of type NodeAffinityArgs, got %T", obj)
312 }
313 return *ptr, validation.ValidateNodeAffinityArgs(nil, ptr)
314 }
315
316 func getPodPreferredNodeAffinity(pod *v1.Pod) (*nodeaffinity.PreferredSchedulingTerms, error) {
317 affinity := pod.Spec.Affinity
318 if affinity != nil && affinity.NodeAffinity != nil && affinity.NodeAffinity.PreferredDuringSchedulingIgnoredDuringExecution != nil {
319 return nodeaffinity.NewPreferredSchedulingTerms(affinity.NodeAffinity.PreferredDuringSchedulingIgnoredDuringExecution)
320 }
321 return nil, nil
322 }
323
324 func getPreScoreState(cycleState *framework.CycleState) (*preScoreState, error) {
325 c, err := cycleState.Read(preScoreStateKey)
326 if err != nil {
327 return nil, fmt.Errorf("reading %q from cycleState: %w", preScoreStateKey, err)
328 }
329
330 s, ok := c.(*preScoreState)
331 if !ok {
332 return nil, fmt.Errorf("invalid PreScore state, got type %T", c)
333 }
334 return s, nil
335 }
336
337 func getPreFilterState(cycleState *framework.CycleState) (*preFilterState, error) {
338 c, err := cycleState.Read(preFilterStateKey)
339 if err != nil {
340 return nil, fmt.Errorf("reading %q from cycleState: %v", preFilterStateKey, err)
341 }
342
343 s, ok := c.(*preFilterState)
344 if !ok {
345 return nil, fmt.Errorf("invalid PreFilter state, got type %T", c)
346 }
347 return s, nil
348 }
349
View as plain text