58 changes: 52 additions & 6 deletions test/e2e/unmanaged_dns_test.go
@@ -5,17 +5,23 @@ package e2e

import (
	"context"
	"fmt"
	"reflect"
	"testing"
	"time"

	configv1 "github.com/openshift/api/config/v1"
	operatorv1 "github.com/openshift/api/operator/v1"
	iov1 "github.com/openshift/api/operatoringress/v1"
	"github.com/openshift/cluster-ingress-operator/pkg/operator/controller"
	ingresscontroller "github.com/openshift/cluster-ingress-operator/pkg/operator/controller/ingress"

	appsv1 "k8s.io/api/apps/v1"
	corev1 "k8s.io/api/core/v1"

	"k8s.io/apimachinery/pkg/api/errors"
	"k8s.io/apimachinery/pkg/types"
	"k8s.io/apimachinery/pkg/util/wait"
)

// TODO: Remove this once this condition is added to all e2e test
@@ -186,6 +192,23 @@ func TestManagedDNSToUnmanagedDNSIngressController(t *testing.T) {
func TestUnmanagedDNSToManagedDNSInternalIngressController(t *testing.T) {
	t.Parallel()

	if infraConfig.Status.PlatformStatus == nil {
		t.Skip("test skipped on nil platform")
	}
	platform := infraConfig.Status.PlatformStatus.Type

	supportedPlatforms := map[configv1.PlatformType]struct{}{
		configv1.AlibabaCloudPlatformType: {},
		configv1.AWSPlatformType:          {},
		configv1.AzurePlatformType:        {},
		configv1.GCPPlatformType:          {},
		configv1.IBMCloudPlatformType:     {},
		configv1.PowerVSPlatformType:      {},
	}
	if _, supported := supportedPlatforms[platform]; !supported {
		t.Skipf("test skipped on platform %q", platform)
	}
Comment on lines +200 to +210
@candita (Contributor), Oct 19, 2022:
I feel like over time, this will cause problems. When a new platform is added, we will have to remember to add it here, or risk not running this test on new platforms. If there is a specific platform that we don't want to run this on, you could do this:

Suggested change
	supportedPlatforms := map[configv1.PlatformType]struct{}{
		configv1.AlibabaCloudPlatformType: {},
		configv1.AWSPlatformType:          {},
		configv1.AzurePlatformType:        {},
		configv1.GCPPlatformType:          {},
		configv1.IBMCloudPlatformType:     {},
		configv1.PowerVSPlatformType:      {},
	}
	if _, supported := supportedPlatforms[platform]; !supported {
		t.Skipf("test skipped on platform %q", platform)
	}
	unsupportedPlatforms := map[configv1.PlatformType]struct{}{
		configv1.someSpecificPlatformType: {},
	}
	if _, unsupported := unsupportedPlatforms[platform]; unsupported {
		t.Skipf("test skipped on platform %q", platform)
	}

Contributor (Author):
Yeah, I see your point: opt-out vs. opt-in. @Miciah wrote this, and I think he wanted to be explicit with an "opt-in" approach to this E2E test.

@Miciah, what are your thoughts, since you added this? What platforms are we really trying to skip here (Nutanix? Libvirt? OpenStack?), and can we even run e2e tests on them?

Contributor:
We're trying to skip platforms that don't use or support LoadBalancer-type services. We have the same or similar logic repeated in several tests. This should probably be refactored as part of a general cleanup of how we handle platform-specific skips.

Contributor (Author):
@Miciah Yeah, I think your point is that this is a larger issue than just this single E2E test. Should we just remove this logic for the time being, in anticipation of a more comprehensive effort? (It's kind of the same debate as Andy's comment on retries: https://github.com/openshift/cluster-ingress-operator/pull/845/files#r999688986)

Contributor:
I don't see a reason to remove this logic—it is strictly better to skip this test on platforms on which we know the test would fail than to run the test and fail on those platforms.

Contributor (Author):
I'm ambivalent about it, especially if we think we should refactor it in the future anyway.

We have the same or similar logic repeated in several tests.

Consistency always wins in my book, even when I don't necessarily agree with the way it's done. I'd rather everything break in the same way than a million things break in different ways.

Contributor:
Before I commented, I searched for uses of this pattern, and I didn't find any in c-i-o, except in the case where we knew we only wanted to run the test on a single platform. https://github.com/openshift/cluster-ingress-operator/search?q=supportedplatforms

Contributor:
GitHub's search is unreliable. The pattern appears in several tests.

  • TestAllowedSourceRanges:
    func TestAllowedSourceRanges(t *testing.T) {
        t.Parallel()
        if infraConfig.Status.PlatformStatus == nil {
            t.Skip("test skipped on nil platform")
        }
        supportedPlatforms := map[configv1.PlatformType]struct{}{
            configv1.AWSPlatformType:   {},
            configv1.AzurePlatformType: {},
            configv1.GCPPlatformType:   {},
        }
        if _, supported := supportedPlatforms[infraConfig.Status.PlatformStatus.Type]; !supported {
            t.Skipf("test skipped on platform %q", infraConfig.Status.PlatformStatus.Type)
        }
  • TestAllowedSourceRangesStatus:
    func TestAllowedSourceRangesStatus(t *testing.T) {
        t.Parallel()
        if infraConfig.Status.PlatformStatus == nil {
            t.Skip("test skipped on nil platform")
        }
        supportedPlatforms := map[configv1.PlatformType]struct{}{
            configv1.AWSPlatformType:   {},
            configv1.AzurePlatformType: {},
            configv1.GCPPlatformType:   {},
        }
        if _, supported := supportedPlatforms[infraConfig.Status.PlatformStatus.Type]; !supported {
            t.Skipf("test skipped on platform %q", infraConfig.Status.PlatformStatus.Type)
        }
  • TestSourceRangesProgressingAndEvaluationConditionsDetectedStatuses:
    func TestSourceRangesProgressingAndEvaluationConditionsDetectedStatuses(t *testing.T) {
        t.Parallel()
        if infraConfig.Status.PlatformStatus == nil {
            t.Skip("test skipped on nil platform")
        }
        supportedPlatforms := map[configv1.PlatformType]struct{}{
            configv1.AWSPlatformType:   {},
            configv1.AzurePlatformType: {},
            configv1.GCPPlatformType:   {},
        }
        if _, supported := supportedPlatforms[infraConfig.Status.PlatformStatus.Type]; !supported {
            t.Skipf("test skipped on platform %q", infraConfig.Status.PlatformStatus.Type)
        }
  • TestInternalLoadBalancer:
    // "LoadBalancerService" endpoint publishing strategy type with scope set to
    // "Internal" and verifies that the operator creates a load balancer and that
    // the load balancer has a private IP address.
    func TestInternalLoadBalancer(t *testing.T) {
        t.Parallel()
        if infraConfig.Status.PlatformStatus == nil {
            t.Skip("test skipped on nil platform")
        }
        platform := infraConfig.Status.PlatformStatus.Type
        supportedPlatforms := map[configv1.PlatformType]struct{}{
            configv1.AWSPlatformType:          {},
            configv1.AzurePlatformType:        {},
            configv1.GCPPlatformType:          {},
            configv1.IBMCloudPlatformType:     {},
            configv1.AlibabaCloudPlatformType: {},
        }
        if _, supported := supportedPlatforms[platform]; !supported {
            t.Skipf("test skipped on platform %q", platform)
        }
  • TestInternalLoadBalancerGlobalAccessGCP:
    func TestInternalLoadBalancerGlobalAccessGCP(t *testing.T) {
        t.Parallel()
        if infraConfig.Status.PlatformStatus == nil {
            t.Skip("test skipped on nil platform")
        }
        supportedPlatforms := map[configv1.PlatformType]struct{}{
            configv1.GCPPlatformType: {},
        }
        if _, supported := supportedPlatforms[infraConfig.Status.PlatformStatus.Type]; !supported {
            t.Skipf("test skipped on platform %q", infraConfig.Status.PlatformStatus.Type)
        }
  • TestScopeChange:
    func TestScopeChange(t *testing.T) {
        t.Parallel()
        if infraConfig.Status.PlatformStatus == nil {
            t.Skip("test skipped on nil platform")
        }
        platform := infraConfig.Status.PlatformStatus.Type
        supportedPlatforms := map[configv1.PlatformType]struct{}{
            configv1.AlibabaCloudPlatformType: {},
            configv1.AWSPlatformType:          {},
            configv1.AzurePlatformType:        {},
            configv1.GCPPlatformType:          {},
            configv1.IBMCloudPlatformType:     {},
            configv1.PowerVSPlatformType:      {},
        }
        if _, supported := supportedPlatforms[platform]; !supported {
            t.Skipf("test skipped on platform %q", platform)
        }
  • TestLocalWithFallbackOverrideForLoadBalancerService:
    func TestLocalWithFallbackOverrideForLoadBalancerService(t *testing.T) {
        supportedPlatforms := map[configv1.PlatformType]struct{}{
            configv1.AWSPlatformType:   {},
            configv1.AzurePlatformType: {},
            configv1.GCPPlatformType:   {},
        }
        if infraConfig.Status.PlatformStatus == nil {
            t.Skip("test skipped on nil platform")
        }
        if _, supported := supportedPlatforms[infraConfig.Status.PlatformStatus.Type]; !supported {
            t.Skipf("test skipped on platform %q", infraConfig.Status.PlatformStatus.Type)
        }
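For illustration, the cleanup discussed above could collapse these repeated blocks into one helper. A minimal sketch, assuming the package-level infraConfig these tests already use; the helper name is hypothetical and does not exist in the repo:

// skipUnlessSupportedPlatform skips the calling test unless the cluster's
// platform is one of the given supported platforms. (Sketch only.)
func skipUnlessSupportedPlatform(t *testing.T, supported ...configv1.PlatformType) {
	t.Helper()
	if infraConfig.Status.PlatformStatus == nil {
		t.Skip("test skipped on nil platform")
	}
	platform := infraConfig.Status.PlatformStatus.Type
	for _, p := range supported {
		if platform == p {
			return
		}
	}
	t.Skipf("test skipped on platform %q", platform)
}

Each test would then open with a single call such as skipUnlessSupportedPlatform(t, configv1.AWSPlatformType, configv1.AzurePlatformType, configv1.GCPPlatformType).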


	name := types.NamespacedName{Namespace: operatorNamespace, Name: "unmanaged-migrated-internal"}
	ic := newLoadBalancerController(name, name.Name+"."+dnsConfig.Spec.BaseDomain)
	ic.Spec.EndpointPublishingStrategy.LoadBalancer = &operatorv1.LoadBalancerStrategy{
@@ -240,8 +263,35 @@ func TestUnmanagedDNSToManagedDNSInternalIngressController(t *testing.T) {
t.Fatalf("failed to update ingresscontroller %s: %v", name, err)
}

Contributor:
Should this step wait for stability too?

Suggested change
	// Wait for the load balancer and DNS to reach stable conditions.
	if err := waitForIngressControllerCondition(t, kclient, 10*time.Minute, name, append(availableConditionsForIngressControllerWithLoadBalancer, operatorProgressingFalse)...); err != nil {
		t.Fatalf("failed to observe expected conditions: %v", err)
	}

@gcs278 (Author), Oct 19, 2022:
We do wait for Ingress/DNS stable conditions on line 300 before we do our verification test.

Contributor:
I've seen (and written) e2e tests where, whenever there's an operation that has side effects, you call waitForIngressControllerCondition. Here, since he called updateIngressControllerSpecWithRetryOnConflict, it might be beneficial to call waitForIngressControllerCondition.

Contributor (Author):
I agree, but we do exactly that: waitForIngressControllerCondition is called on line 300, after this update operation.

It's not immediately below the IC update because we can go do some other things (like checking for the lbService update) before we call waitForIngressControllerCondition, which is more efficient, but it still comes after the update, as you suggest, to make sure we don't have any side effects.

Is that sufficient?

Contributor:
It's a toss-up whether you wait for things to come back to normal after a change, or you wait and redo things over and over in a loop, adding time when you find you need to tweak the test.
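For reference, the update-then-wait pattern under discussion looks roughly like the sketch below. The condition helper and condition list are the ones this test file already uses; the conflict-retry loop is only one plausible shape for updateIngressControllerSpecWithRetryOnConflict (assumed here, using client-go's k8s.io/client-go/util/retry), and the Managed policy constant is assumed from the dnsManagementPolicy API:

	// Sketch: mutate the ingresscontroller spec, retrying on update conflicts,
	// then wait for the operator to report stable conditions before verifying.
	if err := retry.RetryOnConflict(retry.DefaultRetry, func() error {
		ic := &operatorv1.IngressController{}
		if err := kclient.Get(context.TODO(), name, ic); err != nil {
			return err
		}
		ic.Spec.EndpointPublishingStrategy.LoadBalancer.DNSManagementPolicy = operatorv1.ManagedLoadBalancerDNS
		return kclient.Update(context.TODO(), ic)
	}); err != nil {
		t.Fatalf("failed to update ingresscontroller %s: %v", name, err)
	}
	// Other checks (for example, watching the LB service) can run here before
	// the condition wait; what matters is that the wait follows the update.
	if err := waitForIngressControllerCondition(t, kclient, 10*time.Minute, name, availableConditionsForIngressControllerWithLoadBalancer...); err != nil {
		t.Fatalf("failed to observe expected conditions: %v", err)
	}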

	if err := kclient.Delete(context.TODO(), lbService); err != nil && !errors.IsNotFound(err) {
		t.Fatalf("failed to delete svc %s: %v", lbService.Name, err)
	var oldLoadBalancerStatus corev1.LoadBalancerStatus
	lbService.Status.LoadBalancer.DeepCopyInto(&oldLoadBalancerStatus)

	// Only delete the service on platforms that don't automatically update the service's scope.
	switch platform {
	case configv1.AlibabaCloudPlatformType, configv1.AWSPlatformType, configv1.IBMCloudPlatformType, configv1.PowerVSPlatformType:
		if err := kclient.Delete(context.TODO(), lbService); err != nil && !errors.IsNotFound(err) {
Contributor:
Should we have multiple attempts here to mitigate transient failures? Somebody else updated the object, for example.

Contributor (Author):
Hmm, that's a good but loaded question. It's never been an issue in the multiple times I have tried it. Part of me agrees with you, but the other part says, "Well, if we do it here, we need to rewrite a ton of other Gets/Deletes/Updates in this e2e test and others," as this doesn't just apply here.

I think we need standardized common wrapper functions for Delete/Get/Update if we want to mitigate this, as opposed to doing it as one-offs everywhere. We could have a standard "deleteAndRetry" function (I think we have updateAndRetry-type functions already?).

This is probably a good shift-week-type refactoring; I'm hesitant to start doing one-off refactoring since this pattern appears in many more places than just this one, and I think the effort should be coordinated. Let me know if you disagree, or if you have an existing function I can use.

Contributor:
+1 to what Grant said. We've added retries to E2E tests ad hoc in the past, and absent an immediate need, it's reasonable to defer this to some more comprehensive effort to add retries to Kube API calls in E2E tests.

t.Fatalf("failed to delete svc %s: %v", lbService.Name, err)
}
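A sketch of the kind of shared wrapper contemplated here; the name is hypothetical, kclient's controller-runtime client.Client interface is assumed, and NotFound is treated as success:

// deleteWithRetry retries transient delete failures and treats an
// already-deleted object as success. (Sketch only; no such helper exists.)
func deleteWithRetry(cl client.Client, timeout time.Duration, obj client.Object) error {
	return wait.PollImmediate(5*time.Second, timeout, func() (bool, error) {
		if err := cl.Delete(context.TODO(), obj); err != nil && !errors.IsNotFound(err) {
			// Conflicts, timeouts, and other transient errors: retry.
			return false, nil
		}
		return true, nil
	})
}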
Contributor:
Perhaps a wait for stability here too?

Contributor:
There's already a wait after the polling loop. That should be enough:

  1. Verify the service reports a different LB endpoint and is now internal.
  2. Verify the operator doesn't report that it is still updating the configuration.
  3. Verify the dnsrecord now reports "Managed".
  4. Verify we can connect to the LB at its updated address.

Is there a need to repeat one of those checks, or is there some missing check?

Contributor:
If it doesn't matter whether the service was actually deleted or not, and it has no side effects, then you don't need to wait.

@gcs278 (Author), Oct 19, 2022:
Oh sorry, this comment was about something different; ignore my comment above. Edit: deleted that comment.

We do wait on line 278 to make sure the service was updated. We don't need to specifically wait for the service to be deleted, since we just want to trigger an update, and on some platforms that's how you need to do it.

Contributor:
It still isn't clear to me whether there is a missing wait, or an extra wait. If there is a missing wait, it isn't clear to me what it would be or why the test is passing now. If there is an extra wait, I'm not too bothered by it since the test is passing now.

Remember, the goal here is to get CI working again ASAP so that we can be confident that we haven't broken anything, and have time to fix anything that is broken before branching day; barring a major problem with the test (such as breaking it for some job or changing it in a way such that it doesn't cover the intended functionality at all), I'd rather not delay it for issues that can be addressed in a future clean-up.

Contributor:
As an interim, lgtm.

	}

	// Ensure the service's load-balancer status changes.
	err := wait.PollImmediate(10*time.Second, 5*time.Minute, func() (bool, error) {
		lbService := &corev1.Service{}
		if err := kclient.Get(context.TODO(), controller.LoadBalancerServiceName(ic), lbService); err != nil {
			t.Logf("Get %q failed: %v, retrying ...", controller.LoadBalancerServiceName(ic), err)
			return false, nil
		}
		if reflect.DeepEqual(lbService.Status.LoadBalancer, oldLoadBalancerStatus) {
			t.Logf("Waiting for service %q to be updated", controller.LoadBalancerServiceName(ic))
			return false, nil
		} else if ingresscontroller.IsServiceInternal(lbService) {
Contributor:
Moving this check seems odd - can it magically flip between internal and external?

Contributor (Author):
This check was moved just because we needed an up-to-date version of lbService, and it's in the loop since that's where we have one. Flipping isn't a concern here: once it detects that lbService was updated, it checks whether the service is still internal only once and then exits (it's not checking internal/external repeatedly).

This could be moved outside the loop, but that would just require another kclient.Get prior to the check, so I put it in the loop to be more efficient. If you feel it would be clearer outside the loop, let me know.

			// The service got updated, but is not external.
			return true, fmt.Errorf("load balancer %s is internal but should be external", lbService.Name)
		}
		return true, nil
	})
	if err != nil {
		t.Fatalf("error updating the %q service: %v", controller.LoadBalancerServiceName(ic), err)
	}

t.Logf("Waiting for stable conditions on ingresscontroller %s after dnsManagementPolicy=Managed", ic.Name)
@@ -251,10 +301,6 @@ func TestUnmanagedDNSToManagedDNSInternalIngressController(t *testing.T) {
t.Fatalf("failed to observe expected conditions: %v", err)
}

	if !ingresscontroller.IsServiceInternal(lbService) {
Contributor:
Is this an erroneous test, or is it already done elsewhere?

Contributor (Author):
Yep, it's just that in this location it was the opposite of what it actually should have been. I checked other usages to make sure things weren't flipped.

Contributor:
You mean, it was removed because it is erroneous?

Contributor (Author):
Sorry, I misunderstood. Yes, this was definitely incorrect; it was fixed and moved above with the other changes: https://github.com/openshift/cluster-ingress-operator/pull/845/files#diff-a660dcb9b4adcc19e854b3f294ec260efabed12bb55eb2f2b8fb03ff6eb92527R287

t.Fatalf("load balancer %s is internal but should be external", lbService.Name)
}

	// Ensure DNSRecord CR is present.
	if err := kclient.Get(context.TODO(), wildcardRecordName, wildcardRecord); err != nil {
		t.Fatalf("failed to get wildcard dnsrecord %s: %v", wildcardRecordName, err)
66 changes: 59 additions & 7 deletions test/e2e/util_test.go
@@ -8,6 +8,7 @@ import (
"bytes"
"context"
"fmt"
"net"
"net/http"
"strings"
"testing"
@@ -83,6 +84,7 @@ func waitForHTTPClientCondition(t *testing.T, httpClient *http.Client, req *http
	return wait.PollImmediate(interval, timeout, func() (done bool, err error) {
		resp, err := httpClient.Do(req)
		if err == nil {
			defer resp.Body.Close()
Contributor:
Good find!

			return compareFunc(resp), nil
		} else {
			t.Logf("retrying client call due to: %+v", err)
@@ -127,6 +129,7 @@ func buildCurlPod(name, namespace, image, host, address string, extraArgs ...str
			Namespace: namespace,
		},
		Spec: corev1.PodSpec{
			TerminationGracePeriodSeconds: pointer.Int64(0),
			Containers: []corev1.Container{
				{
					Name: "curl",
@@ -472,17 +475,31 @@ func verifyExternalIngressController(t *testing.T, name types.NamespacedName, ho
		}
	}()

	// If we have a DNS name as the external IP address, make sure we can resolve it before moving on.
	// This just limits the number of "could not resolve host" errors, which can be confusing.
	if net.ParseIP(address) == nil {
		if err := wait.PollImmediate(10*time.Second, 5*time.Minute, func() (bool, error) {
Contributor:
That's a long wait in an e2e test, can we get away with 1m?

Contributor (Author):
It's not long considering DNS can very well take up to 5 minutes to propagate on AWS. Keep in mind, these times depend on external processes, not something we have control over. I think we want to give each platform as much time as it needs.

			_, err := net.LookupIP(address)
			if err != nil {
				t.Logf("waiting for loadbalancer domain %s to resolve...", address)
				return false, nil
			}
			return true, nil
		}); err != nil {
			t.Fatalf("loadbalancer domain %s was unable to resolve: %v", address, err)
		}
	}

	req, err := http.NewRequest(http.MethodGet, fmt.Sprintf("http://%s", address), nil)
	if err != nil {
		t.Fatalf("failed to build client request: %v", err)
	}

	// We use the HOST header to map to the domain associated with the ingresscontroller.
	// This ensures our HTTP call is routed to the correct router.
	req.Host = hostname

	httpClient := http.Client{Timeout: 5 * time.Second}
	err = waitForHTTPClientCondition(t, &httpClient, req, 10*time.Second, 5*time.Minute, func(r *http.Response) bool {
	err = waitForHTTPClientCondition(t, &httpClient, req, 10*time.Second, 10*time.Minute, func(r *http.Response) bool {
Contributor:
What do we gain with doubling the timeout? Does just adding 1m help?

Contributor (Author):
So yes, 10 mins is pretty aggressive, but I've seen AWS, Azure, and GCP take over 5 mins. Here's Miciah's answer when I asked why it failed at 5 mins: #845 (comment).

It needs to be at least 7 mins, since we've seen loadbalancers take 6 mins to initialize, but we've been having issues with very long initialization periods for loadbalancers in this test. I could reduce it to 7 or 8 mins, but I don't really see the point if it introduces even more flakes. There isn't much to gain by reducing the wait time here; it runs in parallel.

I'm hesitant, but I can go down a minute or two if you think there is value.

Contributor:
We might just need a longer timeout on the polling loop; the scope change is known to take as long as ~6 minutes on AWS...

I think we should take a minute to consider changes that add 10-15 minutes to a single test. We're already waiting up to 3 hrs on some tests due to things we can't control.

Are customers willing to wait up to 10 minutes for a loadbalancer to initialize? If not, we need to find out why this activity fails to perform on time, not just give it more time to pass CI. Just my opinion.

Contributor (Author):
I think we should take a minute to consider changes that add 10-15 minutes to a single test. We're already waiting up to 3 hrs on some tests due to things we can't control.

Are customers willing to wait up to 10 minutes for a loadbalancer to initialize? If not, we need to find out why this activity fails to perform on time, not just give it more time to pass CI. Just my opinion.

I think our E2E parallelization is not a general customer use case. We are initializing multiple loadbalancers at the same time; 10-20 loadbalancer creations could be happening at once. That's my theory on why we've had to crank these deadlines up and why these activities take so long.

It's probably worth an investigation into how creating multiple loadbalancers at the same time affects initialization time, but I feel that's out of the scope of this PR.

Contributor:
I think we should take a minute to consider changes that add 10-15 minutes to a single test. We're already waiting up to 3 hrs on some tests due to things we can't control.

This only increases the job runtime if (a) this is the longest-running test and (b) the polling loop times out. If the LB is ready after 2 minutes, then it makes no difference whether we specify a timeout of 5 minutes or 10 minutes. If the LB takes 6 minutes to be ready (as is known to be possible on AWS), then setting the timeout below 10 minutes can increase the frequency of flakes, and then you get to wait for the whole E2E job to rerun.

Are customers willing to wait up to 10 minutes for a loadbalancer to initialize? If not, we need to find out why this activity fails to perform on time, not just give it more time to pass CI. Just my opinion.

If there's a regression, it should be tracked as a separate bug. As Grant said, optimizing LB initialization is out of scope for this PR. The goal here is to get CI working again ASAP.

		if r.StatusCode == http.StatusOK {
Contributor:
I think we should be draining the response buffer, ala:

io.Copy(ioutil.Discard, r.Body)

Contributor (Author):
Yup, I agree, but resp.Body.Close() does that for us if we don't do it ourselves: https://groups.google.com/g/golang-nuts/c/4Rr8BYVKrAI/m/HRY-N-8_orcJ

resp.Body.Close() was added in waitForHTTPClientCondition.

t.Logf("verified connectivity with workload with req %v and response %v", req.URL, r.StatusCode)
return true
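For posterity, the explicit drain-then-close idiom from the thread above looks like the following sketch (io.Discard is the modern spelling of ioutil.Discard; whether the drain is needed in addition to Close() for connection reuse is exactly the point debated above):

	resp, err := httpClient.Do(req)
	if err != nil {
		return false, nil
	}
	defer func() {
		// Drain any unread body so the keep-alive connection can be
		// reused, then close it.
		io.Copy(io.Discard, resp.Body)
		resp.Body.Close()
	}()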
Expand Down Expand Up @@ -545,20 +562,32 @@ func verifyInternalIngressController(t *testing.T, name types.NamespacedName, ho
"--retry-delay", "20",
"--max-time", "10",
}
clientPod := buildCurlPod("curl-"+name.Name, echoRoute.Namespace, image, address, echoRoute.Spec.Host, extraArgs...)
clientPodName := types.NamespacedName{Namespace: name.Namespace, Name: "curl-" + name.Name}
clientPodSpec := buildCurlPod(clientPodName.Name, clientPodName.Namespace, image, address, echoRoute.Spec.Host, extraArgs...)
clientPod := clientPodSpec.DeepCopy()
if err := kclient.Create(context.TODO(), clientPod); err != nil {
t.Fatalf("failed to create pod %s/%s: %v", clientPod.Namespace, clientPod.Name, err)
t.Fatalf("failed to create pod %q: %v", clientPodName, err)
}
defer func() {
if err := kclient.Delete(context.TODO(), clientPod); err != nil {
if errors.IsNotFound(err) {
return
}
t.Fatalf("failed to delete pod %s/%s: %v", clientPod.Namespace, clientPod.Name, err)
t.Fatalf("failed to delete pod %q: %v", clientPodName, err)
}
}()

err = wait.PollImmediate(10*time.Second, 5*time.Minute, func() (bool, error) {
var curlPodLogs string
err = wait.PollImmediate(10*time.Second, 10*time.Minute, func() (bool, error) {
Contributor:
Ditto about doubling the timeout here. Can we get away with just adding 1m?

		if err := kclient.Get(context.TODO(), clientPodName, clientPod); err != nil {
			t.Logf("error getting client pod %q: %v, retrying...", clientPodName, err)
			return false, nil
		}
		// First, check whether the client curl pod is still starting and not yet running.
		if clientPod.Status.Phase == corev1.PodPending {
			t.Logf("waiting for client pod %q to start", clientPodName)
			return false, nil
		}
		readCloser, err := client.CoreV1().Pods(clientPod.Namespace).GetLogs(clientPod.Name, &corev1.PodLogOptions{
			Container: "curl",
			Follow:    false,
@@ -573,16 +602,39 @@
t.Errorf("failed to close reader for pod %s: %v", clientPod.Name, err)
}
}()
curlPodLogs = ""
@frobware (Contributor), Oct 19, 2022:
Can this become the declaration?

If, after processing the scanner loop, you can't return because "HTTP/1.0 200 OK" was never matched, then print curlPodLogs. The output would correspond to each iteration through the polling loop. Right now we just accumulate and print in one fell swoop.

Contributor (Author):
Can this become the declaration?

You mean var curlPodLogs string? Done.

If, after processing the scanner loop, you can't return because "HTTP/1.0 200 OK" was never matched, then print curlPodLogs. The output would correspond to each iteration through the polling loop. Right now we just accumulate and print in one fell swoop.

So yeah, I see what you're saying, but it happens a lot that 200 OK isn't matched after a scanner loop (usually DNS issues...). I think if we print every time, we're going to clog up the logs with the same repeated failures. Keep in mind, it's not additive: it scans the entire log on each poll loop. So, with what you're suggesting, I believe you'd get something like this:

log line 1
log line 1
log line 2
log line 1
log line 2
log line 3
log line 1
log line 2
log line 3
log line 4
success!

I just chose to store the last log scan and only output on failures to keep the logs clean. Let me know if this makes sense or if I'm not seeing what you are saying.

Contributor (Author):
Just for posterity, here's what it currently looks like (I intentionally broke it with an invalid IP):

    util_test.go:637: failed to verify connectivity with workload with address: 10.0.128.15 using internal curl client. Curl Pod Logs:
        * Rebuilt URL to: http://test.10.0.128.15/
        * Could not resolve host: test.10.0.128.15
        * Closing connection 0
        * Rebuilt URL to: http://test.10.0.128.15/
        * Could not resolve host: test.10.0.128.15
        * Closing connection 1
        * Rebuilt URL to: http://test.10.0.128.15/
        * Could not resolve host: test.10.0.128.15
        * Closing connection 2
    panic.go:482: deleted ingresscontroller unmanaged-migrated-internal
--- FAIL: TestUnmanagedDNSToManagedDNSInternalIngressController (173.51s)
FAIL
FAIL	github.com/openshift/cluster-ingress-operator/test/e2e	176.610s
FAIL
make: *** [Makefile:56: test-e2e] Error 1

		for scanner.Scan() {
			line := scanner.Text()
			curlPodLogs += line + "\n"
			if strings.Contains(line, "HTTP/1.0 200 OK") {
				t.Logf("verified connectivity with workload with address: %s with response %s", address, line)
				return true, nil
			}
		}
		// If the pod failed or succeeded, it has stopped without giving us a 200 response; try again.
		if clientPod.Status.Phase == corev1.PodFailed || clientPod.Status.Phase == corev1.PodSucceeded {
			t.Logf("client pod %q has stopped...restarting. Curl Pod Logs:\n%s", clientPodName, curlPodLogs)
			if err := kclient.Delete(context.TODO(), clientPod); err != nil && !errors.IsNotFound(err) {
				t.Fatalf("failed to delete pod %q: %v", clientPodName, err)
			}
			// Wait for deletion to prevent a race condition. Use PollInfinite since we are already in a Poll.
			wait.PollInfinite(5*time.Second, func() (bool, error) {
				err = kclient.Get(context.TODO(), clientPodName, clientPod)
				if !errors.IsNotFound(err) {
					t.Logf("waiting for %q to be deleted", clientPodName)
					return false, nil
				}
				return true, nil
			})
			clientPod = clientPodSpec.DeepCopy()
			if err := kclient.Create(context.TODO(), clientPod); err != nil {
				t.Fatalf("failed to create pod %q: %v", clientPodName, err)
			}
			return false, nil
		}
		return false, nil
	})
	if err != nil {
		t.Fatalf("failed to verify connectivity with workload with address: %s using internal curl client: %v", address, err)
		t.Fatalf("failed to verify connectivity with workload with address: %s using internal curl client. Curl Pod Logs:\n%s", address, curlPodLogs)
	}
}