Improve eTP:Local NodePort test

It previously assumed that pod-to-other-node-nodeIP traffic would not be
masqueraded, but most network plugins do masquerade it. Use a HostNetwork
exec pod as the client to avoid the problem.
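
For reference, a HostNetwork pod shares the node's network namespace, so any
connection it opens uses the node's own IP as its source. The test uses the
e2e framework's launchHostExecPod helper for this; the following is only a
rough sketch of the same idea (package name, function name, and image tag are
illustrative, not the helper's actual code):

package sketch

import (
	v1 "k8s.io/api/core/v1"
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
)

// hostExecPod sketches what a "HostNetwork exec pod" is: a pod in the host
// network namespace that just sleeps, so the test can exec curl from it later.
func hostExecPod(namespace, name string) *v1.Pod {
	return &v1.Pod{
		ObjectMeta: metav1.ObjectMeta{Name: name, Namespace: namespace},
		Spec: v1.PodSpec{
			HostNetwork: true, // share the node's network namespace
			Containers: []v1.Container{{
				Name:  "hostexec",
				Image: "registry.k8s.io/e2e-test-images/agnhost:2.47", // illustrative tag
				Args:  []string{"pause"},                              // agnhost "pause" just sleeps
			}},
		},
	}
}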

This also requires putting the client and endpoint on different nodes,
because with most network plugins, a node-to-same-node-pod connection
will end up using the internal "docker0" (or whatever) IP as the
source address rather than the node's public IP, and we don't know
what that IP is.

Also make it work with IPv6.
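
Judging from the new code below, the IPv6 handling mostly comes down to
building the target with net.JoinHostPort rather than concatenating "IP:port"
by hand, since IPv6 literals need brackets in a URL host. A minimal
illustration:

package main

import (
	"fmt"
	"net"
)

func main() {
	// JoinHostPort brackets IPv6 literals; plain concatenation would
	// produce an invalid URL host for an IPv6 node IP.
	fmt.Println(net.JoinHostPort("10.0.0.1", "30080"))    // 10.0.0.1:30080
	fmt.Println(net.JoinHostPort("fd00::1234", "30080"))  // [fd00::1234]:30080
}

The test also passes -g (--globoff) to curl so the brackets in an IPv6 URL are
not interpreted as globbing characters.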
commit fff883ab4a
parent 41527afe28
Author: Dan Winship
Date:   2024-05-08 12:24:11 -04:00

@@ -2693,34 +2693,74 @@ var _ = common.SIGDescribe("Services", func() {
 	})
 
 	ginkgo.It("should support externalTrafficPolicy=Local for type=NodePort", func(ctx context.Context) {
+		e2eskipper.SkipUnlessNodeCountIsAtLeast(2)
+
 		namespace := f.Namespace.Name
 		serviceName := "external-local-nodeport"
 		jig := e2eservice.NewTestJig(cs, namespace, serviceName)
 
-		svc, err := jig.CreateOnlyLocalNodePortService(ctx, true)
-		framework.ExpectNoError(err)
-		ginkgo.DeferCleanup(func(ctx context.Context) {
-			err := cs.CoreV1().Services(svc.Namespace).Delete(ctx, svc.Name, metav1.DeleteOptions{})
-			framework.ExpectNoError(err)
-		})
-
+		ginkgo.By("creating the service")
+		svc, err := jig.CreateOnlyLocalNodePortService(ctx, false)
+		framework.ExpectNoError(err, "creating the service")
 		tcpNodePort := int(svc.Spec.Ports[0].NodePort)
+		nodePortStr := fmt.Sprintf("%d", tcpNodePort)
+		framework.Logf("NodePort is %s", nodePortStr)
 
-		endpointsNodeMap, err := getEndpointNodesWithInternalIP(ctx, jig)
-		framework.ExpectNoError(err)
+		ginkgo.By("creating a HostNetwork exec pod")
+		execPod := launchHostExecPod(ctx, cs, namespace, "hostexec")
+		execPod, err = cs.CoreV1().Pods(namespace).Get(ctx, execPod.Name, metav1.GetOptions{})
+		framework.ExpectNoError(err, "getting podIP of execPod")
+		framework.Logf("execPod IP is %q", execPod.Status.PodIP)
 
-		dialCmd := "clientip"
-		config := e2enetwork.NewNetworkingTestConfig(ctx, f)
-
-		for nodeName, nodeIP := range endpointsNodeMap {
-			ginkgo.By(fmt.Sprintf("reading clientIP using the TCP service's NodePort, on node %v: %v:%v/%v", nodeName, nodeIP, tcpNodePort, dialCmd))
-			clientIP, err := GetHTTPContentFromTestContainer(ctx, config, nodeIP, tcpNodePort, e2eservice.KubeProxyLagTimeout, dialCmd)
-			framework.ExpectNoError(err)
-			framework.Logf("ClientIP detected by target pod using NodePort is %s, the ip of test container is %s", clientIP, config.TestContainerPod.Status.PodIP)
-			// the clientIP returned by agnhost contains port
-			if !strings.HasPrefix(clientIP, config.TestContainerPod.Status.PodIP) {
-				framework.Failf("Source IP was NOT preserved")
-			}
+		ginkgo.By("creating an endpoint for the service on a different node from the execPod")
+		_, err = jig.Run(ctx, func(rc *v1.ReplicationController) {
+			rc.Spec.Template.Spec.Affinity = &v1.Affinity{
+				// We need to ensure the endpoint is on a different node
+				// from the exec pod, to ensure that the source IP of the
+				// traffic is the node's "public" IP. For
+				// node-to-pod-on-same-node traffic, it might end up using
+				// the "docker0" IP or something like that.
+				NodeAffinity: &v1.NodeAffinity{
+					RequiredDuringSchedulingIgnoredDuringExecution: &v1.NodeSelector{
+						NodeSelectorTerms: []v1.NodeSelectorTerm{{
+							MatchFields: []v1.NodeSelectorRequirement{{
+								Key:      "metadata.name",
+								Operator: "NotIn",
+								Values:   []string{execPod.Spec.NodeName},
+							}},
+						}},
+					},
+				},
+			}
+		})
+		framework.ExpectNoError(err, "creating the endpoint pod")
+
+		// Extract the single endpoint node IP from a map of endpoint node IPs
+		var endpointNodeIP string
+		endpointsNodeMap, err := getEndpointNodesWithInternalIP(ctx, jig)
+		framework.ExpectNoError(err, "fetching endpoint node IPs")
+		for node, nodeIP := range endpointsNodeMap {
+			framework.Logf("endpoint is on node %s (%s)", node, nodeIP)
+			endpointNodeIP = nodeIP
+			break
+		}
+
+		ginkgo.By("connecting from the execpod to the NodePort on the endpoint's node")
+		cmd := fmt.Sprintf("curl -g -q -s --connect-timeout 3 http://%s/clientip", net.JoinHostPort(endpointNodeIP, nodePortStr))
+		var clientIP string
+		err = wait.PollImmediate(framework.Poll, e2eservice.KubeProxyLagTimeout, func() (bool, error) {
+			clientIPPort, err := e2eoutput.RunHostCmd(execPod.Namespace, execPod.Name, cmd)
+			if err != nil {
+				framework.Logf("error connecting: %v", err)
+				return false, nil
+			}
+			clientIP, _, err = net.SplitHostPort(clientIPPort)
+			framework.ExpectNoError(err, "parsing clientip output")
+			return true, nil
+		})
+		framework.ExpectNoError(err, "connecting to nodeport service")
+		if clientIP != execPod.Status.PodIP {
+			framework.Failf("Source IP %s is not the client IP", clientIP)
 		}
 	})
@@ -2795,7 +2835,7 @@ var _ = common.SIGDescribe("Services", func() {
 		framework.ExpectNoError(err)
 
 		// validate that the health check node port from kube-proxy returns 503 when there are no ready endpoints
-		err = wait.PollImmediate(time.Second, time.Minute, func() (bool, error) {
+		err = wait.PollUntilContextTimeout(ctx, time.Second, time.Minute, true, func(ctx context.Context) (bool, error) {
 			cmd := fmt.Sprintf(`curl -s -o /dev/null -w "%%{http_code}" --max-time 5 http://%s/healthz`, healthCheckNodePortAddr)
 			out, err := e2eoutput.RunHostCmd(pausePod0.Namespace, pausePod0.Name, cmd)
 			if err != nil {