Skip to content

Commit

Permalink
Merge pull request #124849 from gabesaba/gated-fix-1.29
Browse files Browse the repository at this point in the history
cherry pick #124618 to 1.29
  • Loading branch information
k8s-ci-robot authored Jun 4, 2024
2 parents 32a40cc + b66ebe1 commit ac2c0f2
Show file tree
Hide file tree
Showing 4 changed files with 81 additions and 26 deletions.
5 changes: 5 additions & 0 deletions pkg/scheduler/internal/queue/scheduling_queue.go
Original file line number Diff line number Diff line change
Expand Up @@ -1143,6 +1143,11 @@ func (p *PriorityQueue) requeuePodViaQueueingHint(logger klog.Logger, pInfo *fra
func (p *PriorityQueue) movePodsToActiveOrBackoffQueue(logger klog.Logger, podInfoList []*framework.QueuedPodInfo, event framework.ClusterEvent, oldObj, newObj interface{}) {
activated := false
for _, pInfo := range podInfoList {
// Since there may be many gated pods and they will not move from the
// unschedulable pool, we skip calling the expensive isPodWorthRequeueing.
if pInfo.Gated {
continue
}
schedulingHint := p.isPodWorthRequeuing(logger, pInfo, event, oldObj, newObj)
if schedulingHint == queueSkip {
// QueueingHintFn determined that this Pod isn't worth putting to activeQ or backoffQ by this event.
Expand Down
15 changes: 14 additions & 1 deletion pkg/scheduler/internal/queue/scheduling_queue_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -95,6 +95,11 @@ var (
}
)

func setQueuedPodInfoGated(queuedPodInfo *framework.QueuedPodInfo) *framework.QueuedPodInfo {
queuedPodInfo.Gated = true
return queuedPodInfo
}

func getUnschedulablePod(p *PriorityQueue, pod *v1.Pod) *v1.Pod {
pInfo := p.unschedulablePods.get(pod)
if pInfo != nil {
Expand Down Expand Up @@ -1314,6 +1319,14 @@ func TestPriorityQueue_MoveAllToActiveOrBackoffQueueWithQueueingHint(t *testing.
hint: queueHintReturnSkip,
expectedQ: unschedulablePods,
},
{
name: "QueueHintFunction is not called when Pod is gated",
podInfo: setQueuedPodInfoGated(&framework.QueuedPodInfo{PodInfo: mustNewPodInfo(p), UnschedulablePlugins: sets.New("foo")}),
hint: func(logger klog.Logger, pod *v1.Pod, oldObj, newObj interface{}) (framework.QueueingHint, error) {
return framework.Queue, fmt.Errorf("QueueingHintFn should not be called as pod is gated")
},
expectedQ: unschedulablePods,
},
}

for _, test := range tests {
Expand Down Expand Up @@ -2483,7 +2496,7 @@ func TestPendingPodsMetric(t *testing.T) {
gated := makeQueuedPodInfos(total-queueableNum, "y", failme, timestamp)
// Manually mark them as gated=true.
for _, pInfo := range gated {
pInfo.Gated = true
setQueuedPodInfoGated(pInfo)
}
pInfos = append(pInfos, gated...)
totalWithDelay := 20
Expand Down
2 changes: 1 addition & 1 deletion test/integration/scheduler/plugins/plugins_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -2688,7 +2688,7 @@ func TestSchedulingGatesPluginEventsToRegister(t *testing.T) {
{
name: "preEnqueue plugin with event registered",
enqueuePlugin: &SchedulingGatesPluginWithEvents{SchedulingGates: schedulinggates.SchedulingGates{EnablePodSchedulingReadiness: true}},
count: 3,
count: 2,
},
}

Expand Down
85 changes: 61 additions & 24 deletions test/integration/scheduler/queue_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -56,12 +56,13 @@ import (

func TestSchedulingGates(t *testing.T) {
tests := []struct {
name string
pods []*v1.Pod
featureEnabled bool
want []string
rmPodsSchedulingGates []int
wantPostGatesRemoval []string
name string
pods []*v1.Pod
featureEnabled bool
want []string
delete []string
unschedulable []string
rmGates []string
}{
{
name: "feature disabled, regular pods",
Expand Down Expand Up @@ -98,6 +99,7 @@ func TestSchedulingGates(t *testing.T) {
},
featureEnabled: true,
want: []string{"p2"},
unschedulable: []string{"p1"},
},
{
name: "feature enabled, two pod carrying scheduling gates, and remove gates of one pod",
Expand All @@ -106,10 +108,22 @@ func TestSchedulingGates(t *testing.T) {
st.MakePod().Name("p2").SchedulingGates([]string{"bar"}).Container("pause").Obj(),
st.MakePod().Name("p3").Container("pause").Obj(),
},
featureEnabled: true,
want: []string{"p3"},
rmPodsSchedulingGates: []int{1}, // remove gates of 'p2'
wantPostGatesRemoval: []string{"p2"},
featureEnabled: true,
want: []string{"p3"},
unschedulable: []string{"p1", "p2"},
rmGates: []string{"p2"},
},
{
name: "gated pod schedulable after deleting the scheduled pod and removing gate",
pods: []*v1.Pod{
st.MakePod().Name("p1").SchedulingGates([]string{"foo"}).Container("pause").Obj(),
st.MakePod().Name("p2").Container("pause").Obj(),
},
featureEnabled: true,
want: []string{"p2"},
delete: []string{"p2"},
unschedulable: []string{"p1"},
rmGates: []string{"p1"},
},
}

Expand All @@ -130,6 +144,15 @@ func TestSchedulingGates(t *testing.T) {
testutils.SyncSchedulerInformerFactory(testCtx)

cs, ns, ctx := testCtx.ClientSet, testCtx.NS.Name, testCtx.Ctx

// Create node, so we can schedule pods.
node := st.MakeNode().Name("node").Obj()
if _, err := cs.CoreV1().Nodes().Create(ctx, node, metav1.CreateOptions{}); err != nil {
t.Fatal("Failed to create node")

}

// Create pods.
for _, p := range tt.pods {
p.Namespace = ns
if _, err := cs.CoreV1().Pods(ns).Create(ctx, p, metav1.CreateOptions{}); err != nil {
Expand All @@ -145,30 +168,44 @@ func TestSchedulingGates(t *testing.T) {
t.Fatal(err)
}

// Pop the expected pods out. They should be de-queueable.
for _, wantPod := range tt.want {
podInfo := testutils.NextPodOrDie(t, testCtx)
if got := podInfo.Pod.Name; got != wantPod {
t.Errorf("Want %v to be popped out, but got %v", wantPod, got)
go testCtx.Scheduler.Run(ctx)

// Verify pods scheduled.
for _, podName := range tt.want {
if err := wait.PollUntilContextTimeout(ctx, time.Millisecond*200, wait.ForeverTestTimeout, false, testutils.PodScheduled(cs, ns, podName)); err != nil {
t.Fatalf("Failed to schedule %s", podName)
}
}

// Delete pods, which triggers AssignedPodDelete event in the scheduling queue.
for _, podName := range tt.delete {
if err := cs.CoreV1().Pods(ns).Delete(ctx, podName, metav1.DeleteOptions{}); err != nil {
t.Fatalf("Error calling Delete on %s", podName)
}
if err := wait.PollUntilContextTimeout(ctx, time.Millisecond*200, wait.ForeverTestTimeout, false, testutils.PodDeleted(ctx, cs, ns, podName)); err != nil {
t.Fatalf("Failed to delete %s", podName)
}
}

if len(tt.rmPodsSchedulingGates) == 0 {
return
// Verify gated pods unschedulable.
for _, podName := range tt.unschedulable {
if err := wait.PollUntilContextTimeout(ctx, time.Millisecond*200, wait.ForeverTestTimeout, false, testutils.PodSchedulingGated(cs, ns, podName).WithContext()); err != nil {
t.Fatalf("Failed to verify unschedulable %s", podName)
}
}

// Remove scheduling gates from the pod spec.
for _, idx := range tt.rmPodsSchedulingGates {
for _, podName := range tt.rmGates {
patch := `{"spec": {"schedulingGates": null}}`
podName := tt.pods[idx].Name
if _, err := cs.CoreV1().Pods(ns).Patch(ctx, podName, types.StrategicMergePatchType, []byte(patch), metav1.PatchOptions{}); err != nil {
t.Fatalf("Failed to patch pod %v: %v", podName, err)
}
}
// Pop the expected pods out. They should be de-queueable.
for _, wantPod := range tt.wantPostGatesRemoval {
podInfo := testutils.NextPodOrDie(t, testCtx)
if got := podInfo.Pod.Name; got != wantPod {
t.Errorf("Want %v to be popped out, but got %v", wantPod, got)

// Verify pods without gates scheduled.
for _, podName := range tt.rmGates {
if err := wait.PollUntilContextTimeout(ctx, time.Millisecond*200, wait.ForeverTestTimeout, false, testutils.PodScheduled(cs, ns, podName)); err != nil {
t.Fatalf("Failed to schedule %s", podName)
}
}
})
Expand Down

0 comments on commit ac2c0f2

Please sign in to comment.