Add GracefulNodeShutdown e2e test

commit e367d2fe0c
parent 0bf274d471
@@ -132,6 +132,7 @@ go_test(
         "mirror_pod_test.go",
         "node_container_manager_test.go",
         "node_perf_test.go",
+        "node_shutdown_linux_test.go",
         "pids_test.go",
         "pod_hostnamefqdn_test.go",
         "pods_container_manager_test.go",
test/e2e_node/node_shutdown_linux_test.go  (new file, 228 lines)

@@ -0,0 +1,228 @@
// +build linux

/*
Copyright 2021 The Kubernetes Authors.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package e2enode

import (
    "context"
    "fmt"
    "strconv"
    "time"

    "k8s.io/apimachinery/pkg/fields"

    "github.com/onsi/ginkgo"
    "github.com/onsi/gomega"
    v1 "k8s.io/api/core/v1"
    metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
    "k8s.io/kubernetes/pkg/apis/scheduling"
    "k8s.io/kubernetes/pkg/features"
    kubeletconfig "k8s.io/kubernetes/pkg/kubelet/apis/config"
    kubelettypes "k8s.io/kubernetes/pkg/kubelet/types"
    "k8s.io/kubernetes/test/e2e/framework"
)

var _ = framework.KubeDescribe("GracefulNodeShutdown [Serial] [NodeAlphaFeature:GracefulNodeShutdown]", func() {
    f := framework.NewDefaultFramework("graceful-node-shutdown")
    ginkgo.Context("when gracefully shutting down", func() {

        const (
            pollInterval                        = 1 * time.Second
            podStatusUpdateTimeout              = 5 * time.Second
            nodeStatusUpdateTimeout             = 10 * time.Second
            nodeShutdownGracePeriod             = 20 * time.Second
            nodeShutdownGracePeriodCriticalPods = 10 * time.Second
        )

        tempSetCurrentKubeletConfig(f, func(initialConfig *kubeletconfig.KubeletConfiguration) {
            initialConfig.FeatureGates = map[string]bool{
                string(features.GracefulNodeShutdown): true,
            }
            initialConfig.ShutdownGracePeriod = metav1.Duration{Duration: nodeShutdownGracePeriod}
            initialConfig.ShutdownGracePeriodCriticalPods = metav1.Duration{Duration: nodeShutdownGracePeriodCriticalPods}
        })

        ginkgo.AfterEach(func() {
            ginkgo.By("Emitting Shutdown false signal; cancelling the shutdown")
            err := emitSignalPrepareForShutdown(false)
            framework.ExpectNoError(err)
        })

        ginkgo.It("should be able to gracefully shutdown pods with various grace periods", func() {
            nodeName := getNodeName(f)
            nodeSelector := fields.Set{
                "spec.nodeName": nodeName,
            }.AsSelector().String()

            // Define test pods
            pods := []*v1.Pod{
                getGracePeriodOverrideTestPod("period-120", nodeName, 120, false),
                getGracePeriodOverrideTestPod("period-5", nodeName, 5, false),
                getGracePeriodOverrideTestPod("period-critical-120", nodeName, 120, true),
                getGracePeriodOverrideTestPod("period-critical-5", nodeName, 5, true),
            }

            ginkgo.By("Creating batch pods")
            f.PodClient().CreateBatch(pods)

            list, err := f.PodClient().List(context.TODO(), metav1.ListOptions{
                FieldSelector: nodeSelector,
            })
            framework.ExpectNoError(err)
            framework.ExpectEqual(len(list.Items), len(pods), "the number of pods is not as expected")

            for _, pod := range list.Items {
                framework.ExpectEqual(
                    pod.Status.Phase,
                    v1.PodRunning,
                    "pod is not ready",
                )
            }

            ginkgo.By("Emitting shutdown signal")
            err = emitSignalPrepareForShutdown(true)
            framework.ExpectNoError(err)

            // Not critical pod should be shutdown
            gomega.Eventually(func() error {
                list, err = f.PodClient().List(context.TODO(), metav1.ListOptions{
                    FieldSelector: nodeSelector,
                })
                if err != nil {
                    return err
                }
                framework.ExpectEqual(len(list.Items), len(pods), "the number of pods is not as expected")

                for _, pod := range list.Items {
                    if kubelettypes.IsCriticalPod(&pod) {
                        if pod.Status.Phase != v1.PodRunning {
                            return fmt.Errorf("critical pod should not be shutdown, phase: %s", pod.Status.Phase)
                        }
                    } else {
                        if pod.Status.Phase != v1.PodFailed || pod.Status.Reason != "Shutdown" {
                            return fmt.Errorf("pod should be shutdown, phase: %s", pod.Status.Phase)
                        }
                    }
                }
                return nil
            }, podStatusUpdateTimeout, pollInterval).Should(gomega.BeNil())

            // All pod should be shutdown
            gomega.Eventually(func() error {
                list, err = f.PodClient().List(context.TODO(), metav1.ListOptions{
                    FieldSelector: nodeSelector,
                })
                if err != nil {
                    return err
                }
                framework.ExpectEqual(len(list.Items), len(pods), "the number of pods is not as expected")

                for _, pod := range list.Items {
                    if pod.Status.Phase != v1.PodFailed || pod.Status.Reason != "Shutdown" {
                        return fmt.Errorf("pod should be shutdown, phase: %s", pod.Status.Phase)
                    }
                }
                return nil
            },
                // Critical pod starts shutdown after (nodeShutdownGracePeriod-nodeShutdownGracePeriodCriticalPods)
                podStatusUpdateTimeout+(nodeShutdownGracePeriod-nodeShutdownGracePeriodCriticalPods),
                pollInterval).Should(gomega.BeNil())
        })

        ginkgo.It("should be able to handle a cancelled shutdown", func() {
            ginkgo.By("Emitting Shutdown signal")
            err := emitSignalPrepareForShutdown(true)
            framework.ExpectNoError(err)
            gomega.Eventually(func() error {
                isReady := getNodeReadyStatus(f)
                if isReady {
                    return fmt.Errorf("node did not become shutdown as expected")
                }
                return nil
            }, nodeStatusUpdateTimeout, pollInterval).Should(gomega.BeNil())

            ginkgo.By("Emitting Shutdown false signal; cancelling the shutdown")
            err = emitSignalPrepareForShutdown(false)
            framework.ExpectNoError(err)
            gomega.Eventually(func() error {
                isReady := getNodeReadyStatus(f)
                if !isReady {
                    return fmt.Errorf("node did not recover as expected")
                }
                return nil
            }, nodeStatusUpdateTimeout, pollInterval).Should(gomega.BeNil())
        })
    })
})

func getGracePeriodOverrideTestPod(name string, node string, gracePeriod int64, critical bool) *v1.Pod {
    pod := &v1.Pod{
        TypeMeta: metav1.TypeMeta{
            Kind:       "Pod",
            APIVersion: "v1",
        },
        ObjectMeta: metav1.ObjectMeta{
            Name: name,
        },
        Spec: v1.PodSpec{
            Containers: []v1.Container{
                {
                    Name:    name,
                    Image:   busyboxImage,
                    Command: []string{"sh", "-c"},
                    Args: []string{`
_term() {
    echo "Caught SIGTERM signal!"
    sleep infinity
}
trap _term SIGTERM
sleep infinity
`},
                },
            },
            TerminationGracePeriodSeconds: &gracePeriod,
            NodeName:                      node,
        },
    }
    if critical {
        pod.ObjectMeta.Annotations = map[string]string{
            kubelettypes.ConfigSourceAnnotationKey: kubelettypes.FileSource,
        }
        pod.Spec.PriorityClassName = scheduling.SystemNodeCritical

        framework.ExpectEqual(kubelettypes.IsCriticalPod(pod), true, "pod should be a critical pod")
    } else {
        framework.ExpectEqual(kubelettypes.IsCriticalPod(pod), false, "pod should not be a critical pod")
    }
    return pod
}

// Emits a fake PrepareForShutdown dbus message on system dbus. Will cause kubelet to react to an active shutdown event.
func emitSignalPrepareForShutdown(b bool) error {
    cmd := "gdbus emit --system --object-path /org/freedesktop/login1 --signal org.freedesktop.login1.Manager.PrepareForShutdown " + strconv.FormatBool(b)
    _, err := runCommand("sh", "-c", cmd)
    return err
}

func getNodeReadyStatus(f *framework.Framework) bool {
    nodeList, err := f.ClientSet.CoreV1().Nodes().List(context.TODO(), metav1.ListOptions{})
    framework.ExpectNoError(err)
    // Assuming that there is only one node, because this is a node e2e test.
    framework.ExpectEqual(len(nodeList.Items), 1)
    return isNodeReady(&nodeList.Items[0])
}
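Note on manual verification: the test triggers graceful shutdown handling by faking the systemd-logind PrepareForShutdown signal rather than actually powering the node down. The same signal the test's emitSignalPrepareForShutdown helper sends can be emitted by hand on a node; this is a sketch that assumes the node runs systemd-logind and has the gdbus CLI available (the same assumptions the test itself makes):

    # Announce an imminent shutdown; a kubelet with the GracefulNodeShutdown
    # feature gate enabled reacts as if the node were shutting down
    gdbus emit --system --object-path /org/freedesktop/login1 \
      --signal org.freedesktop.login1.Manager.PrepareForShutdown true

    # Cancel the shutdown again, as the test's AfterEach does
    gdbus emit --system --object-path /org/freedesktop/login1 \
      --signal org.freedesktop.login1.Manager.PrepareForShutdown false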