4 changes: 4 additions & 0 deletions pkg/cmd/openshift-tests/monitor/run/run_monitor_command.go
@@ -13,6 +13,7 @@ import (

"github.com/openshift/origin/pkg/clioptions/imagesetup"
"github.com/openshift/origin/pkg/monitortestframework"
exutil "github.com/openshift/origin/test/extended/util"

"github.com/openshift/origin/pkg/monitor/monitorapi"
"github.com/openshift/origin/test/extended/util/image"
@@ -92,6 +93,9 @@ func (f *RunMonitorFlags) BindFlags(flags *pflag.FlagSet) {
}

func (f *RunMonitorFlags) ToOptions() (*RunMonitorOptions, error) {
// Set testsStarted = true to avoid the "May only be called from within a test case" panic
exutil.WithCleanup(func() {})

var displayFilterFn monitorapi.EventIntervalMatchesFunc
if f.DisplayFromNow {
now := time.Now()
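The WithCleanup call above works around a guard in the extended-test utilities that panics when CLI helpers are used outside a test case (the "May only be called from within a test case" panic discussed in the review comments below). Here is a minimal sketch of how such a guard plausibly works; the names testsStarted and requiresTestStart are inferred from the panic message and stack trace, not copied from the actual origin source:

```go
package util

// testsStarted records whether a test entry point has run; hypothetical sketch.
var testsStarted bool

// WithCleanup marks the test framework as started before running f, so that
// helpers guarded by requiresTestStart no longer panic. (The real
// exutil.WithCleanup presumably also registers cleanup handlers, elided here.)
func WithCleanup(f func()) {
	testsStarted = true
	f()
}

// requiresTestStart is the guard visible in the panic stack trace: CLI helpers
// that need a running test call it first.
func requiresTestStart() {
	if !testsStarted {
		panic("May only be called from within a test case")
	}
}
```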
3 changes: 3 additions & 0 deletions pkg/defaultmonitortests/types.go
@@ -6,6 +6,7 @@ import (
"github.com/openshift/origin/pkg/monitortestframework"
Unclear if this is related to these changes or not, but the e2e-gcp-ovn-upgrade run's monitor logs contain:

  E0731 11:46:20.951174    2139 runtime.go:140] "Observed a panic" panic="May only be called from within a test case" stacktrace=<
  	goroutine 498 [running]:
  	k8s.io/apimachinery/pkg/util/runtime.logPanic({0x9005b58, 0xc00075e000}, {0x73297c0, 0x8f7f930})
  		k8s.io/[email protected]/pkg/util/runtime/runtime.go:132 +0xbc
  	k8s.io/apimachinery/pkg/util/runtime.handleCrash({0x9005b58, 0xc00075e000}, {0x73297c0, 0x8f7f930}, {0x0, 0x0, 0x2951560?})
  		k8s.io/[email protected]/pkg/util/runtime/runtime.go:107 +0x116
  	k8s.io/apimachinery/pkg/util/runtime.HandleCrashWithContext({0x9005b58, 0xc00075e000}, {0x0, 0x0, 0x0})
  		k8s.io/[email protected]/pkg/util/runtime/runtime.go:78 +0x5a
  	panic({0x73297c0?, 0x8f7f930?})
  		runtime/panic.go:792 +0x132
  	github.com/openshift/origin/test/extended/util.requiresTestStart(...)

(the trace was interleaved with concurrent monitor startup logs:)

  time="2025-07-31T11:46:20Z" level=info msg="  Starting legacy-kube-apiserver-invariants for kube-apiserver"
  time="2025-07-31T11:46:20Z" level=info msg="  Starting legacy-networking-invariants for Networking / cluster-network-operator"
  time="2025-07-31T11:46:20Z" level=info msg="  Starting pod-lifecycle for Node / Kubelet"
  time="2025-07-31T11:46:20Z" level=info msg="  Starting legacy-storage-invariants for Storage"
  time="2025-07-31T11:46:20Z" level=info msg="  Starting legacy-test-framework-invariants for Test Framework"
  time="2025-07-31T11:46:20Z" level=info msg="  Starting staicpod-install-monitor for kube-apiserver"

While I am figuring out the cause, let's see if it recurs.

/test e2e-gcp-ovn-upgrade

@hongkailiu Aug 4, 2025

Let's see if a957e64 fixes it.

I cannot figure out why the status command stopped panicking after a while: the status command seems to be working, and its output is stored in https://gcsweb-ci.apps.ci.l2s4.p1.openshiftapps.com/gcs/test-platform-results/pr-logs/pull/30031/pull-ci-openshift-origin-main-e2e-gcp-ovn-upgrade/1950870499584118784/artifacts/e2e-gcp-ovn-upgrade/openshift-e2e-test/artifacts/junit/adm-upgrade-status/

Does that mean testsStarted was handled already, just a bit late?

"github.com/openshift/origin/pkg/monitortests/authentication/legacyauthenticationmonitortests"
"github.com/openshift/origin/pkg/monitortests/authentication/requiredsccmonitortests"
admupgradestatus "github.com/openshift/origin/pkg/monitortests/cli/adm_upgrade/status"
azuremetrics "github.com/openshift/origin/pkg/monitortests/cloud/azure/metrics"
"github.com/openshift/origin/pkg/monitortests/clusterversionoperator/legacycvomonitortests"
"github.com/openshift/origin/pkg/monitortests/clusterversionoperator/operatorstateanalyzer"
@@ -207,5 +208,7 @@ func newUniversalMonitorTests(info monitortestframework.MonitorTestInitializatio
monitorTestRegistry.AddMonitorTestOrDie("watch-namespaces", "Test Framework", watchnamespaces.NewNamespaceWatcher())
monitorTestRegistry.AddMonitorTestOrDie("high-cpu-test-analyzer", "Test Framework", highcputestanalyzer.NewHighCPUTestAnalyzer())

monitorTestRegistry.AddMonitorTestOrDie("oc-adm-upgrade-status", "oc / update", admupgradestatus.NewOcAdmUpgradeStatusChecker())

return monitorTestRegistry
}
6 changes: 6 additions & 0 deletions pkg/monitortests/cli/adm_upgrade/OWNERS
@@ -0,0 +1,6 @@
# See the OWNERS docs: https://git.k8s.io/community/contributors/guide/owners.md

approvers:
- cluster-version-operator-test-case-approvers
reviewers:
- cluster-version-operator-test-case-reviewers
193 changes: 193 additions & 0 deletions pkg/monitortests/cli/adm_upgrade/status/monitortest.go
@@ -0,0 +1,193 @@
package admupgradestatus

import (
"context"
"fmt"
"os"
"path"
"path/filepath"
"strings"
"time"

clientconfigv1 "github.com/openshift/client-go/config/clientset/versioned"
"github.com/openshift/origin/pkg/monitortestframework"
exutil "github.com/openshift/origin/test/extended/util"
"k8s.io/apimachinery/pkg/util/errors"
"k8s.io/apimachinery/pkg/util/wait"
"k8s.io/client-go/kubernetes"
"k8s.io/client-go/rest"

"github.com/openshift/origin/pkg/monitor/monitorapi"
"github.com/openshift/origin/pkg/test/ginkgo/junitapi"
)

type snapshot struct {
when time.Time
out string
err error
}

type monitor struct {
collectionDone chan struct{}
ocAdmUpgradeStatus map[time.Time]*snapshot
notSupportedReason error
isSNO bool
}

func NewOcAdmUpgradeStatusChecker() monitortestframework.MonitorTest {
return &monitor{
collectionDone: make(chan struct{}),
ocAdmUpgradeStatus: map[time.Time]*snapshot{},
}
}

func (w *monitor) PrepareCollection(ctx context.Context, adminRESTConfig *rest.Config, recorder monitorapi.RecorderWriter) error {
kubeClient, err := kubernetes.NewForConfig(adminRESTConfig)
if err != nil {
return err
}
isMicroShift, err := exutil.IsMicroShiftCluster(kubeClient)
if err != nil {
return fmt.Errorf("unable to determine if cluster is MicroShift: %v", err)
}
if isMicroShift {
w.notSupportedReason = &monitortestframework.NotSupportedError{Reason: "platform MicroShift not supported"}
return w.notSupportedReason
}
clientconfigv1client, err := clientconfigv1.NewForConfig(adminRESTConfig)
if err != nil {
return err
}

if ok, err := exutil.IsHypershift(ctx, clientconfigv1client); err != nil {
return fmt.Errorf("unable to determine if cluster is Hypershift: %v", err)
} else if ok {
w.notSupportedReason = &monitortestframework.NotSupportedError{Reason: "platform Hypershift not supported"}
return w.notSupportedReason
}

if ok, err := exutil.IsSingleNode(ctx, clientconfigv1client); err != nil {
return fmt.Errorf("unable to determine if cluster is single node: %v", err)
} else {
w.isSNO = ok
}
return nil
}

func snapshotOcAdmUpgradeStatus(ch chan *snapshot) {
// TODO: I _think_ this should somehow use the adminRESTConfig given to StartCollection, but I don't know
// how to pass that to exutil.NewCLI* or if it is even possible. It seems to work this way though.
oc := exutil.NewCLIWithoutNamespace("adm-upgrade-status").AsAdmin()
now := time.Now()

var out string
var err error
// retry on brief apiserver unavailability
if errWait := wait.PollUntilContextTimeout(context.Background(), 10*time.Second, 2*time.Minute, true, func(context.Context) (bool, error) {
cmd := oc.Run("adm", "upgrade", "status").EnvVar("OC_ENABLE_CMD_UPGRADE_STATUS", "true")
out, err = cmd.Output()
if err != nil {
return false, nil
}
return true, nil
}); errWait != nil {
out = ""
err = errWait
}
ch <- &snapshot{when: now, out: out, err: err}
}

func (w *monitor) StartCollection(ctx context.Context, adminRESTConfig *rest.Config, recorder monitorapi.RecorderWriter) error {
if w.notSupportedReason != nil {
return w.notSupportedReason
}
// TODO: The double goroutine spawn should probably be placed under some abstraction
go func(ctx context.Context) {
snapshots := make(chan *snapshot)
go func() {
for snap := range snapshots {
// TODO: Maybe also collect some cluster resources (CV? COs?) through recorder?
w.ocAdmUpgradeStatus[snap.when] = snap
}
w.collectionDone <- struct{}{}
}()
// TODO: Configurable interval?
// TODO: Collect multiple invocations (--details)? Would need another producer/consumer pair, and likely
// collectionDone would need to be a WaitGroup

wait.UntilWithContext(ctx, func(ctx context.Context) { snapshotOcAdmUpgradeStatus(snapshots) }, time.Minute)
// UntilWithContext blocks until the framework cancels the context when it wants tests to stop. When we
// get here, we know the last snapshotOcAdmUpgradeStatus producer has written to the snapshots channel, so
// we can close it, which in turn allows the consumer to finish and signal collectionDone.
close(snapshots)
}(ctx)

return nil
}

func (w *monitor) CollectData(ctx context.Context, storageDir string, beginning, end time.Time) (monitorapi.Intervals, []*junitapi.JUnitTestCase, error) {
if w.notSupportedReason != nil {
return nil, nil, w.notSupportedReason
}

// The framework cancels the context it gave StartCollection before it calls CollectData, but we need to
// wait for the collection goroutines spawned in StartCollection to finish
<-w.collectionDone

noFailures := &junitapi.JUnitTestCase{
Name: "[sig-cli][OCPFeatureGate:UpgradeStatus] oc adm upgrade status never fails",
}

var failures []string
var total int
for when, observed := range w.ocAdmUpgradeStatus {
total++
if observed.err != nil {
failures = append(failures, fmt.Sprintf("- %s: %v", when.Format(time.RFC3339), observed.err))
}
}

// Zero failures is too strict for at least SNO clusters: non-SNO clusters tolerate no failures, SNO
// tolerates up to 10% failed invocations. Compute the percentage as failures*100/total (the other order
// would always yield 0 under integer division) and guard against an empty snapshot map.
failedPct := 0
if total > 0 {
failedPct = len(failures) * 100 / total
}
if (!w.isSNO && len(failures) > 0) || (w.isSNO && failedPct > 10) {
noFailures.FailureOutput = &junitapi.FailureOutput{
Message: fmt.Sprintf("oc adm upgrade status failed %d times (of %d)", len(failures), total),
Output: strings.Join(failures, "\n"),
}
}

// TODO: Maybe utilize Intervals somehow and do tests in ComputeComputedIntervals and EvaluateTestsFromConstructedIntervals

return nil, []*junitapi.JUnitTestCase{noFailures}, nil
}

func (w *monitor) ConstructComputedIntervals(ctx context.Context, startingIntervals monitorapi.Intervals, recordedResources monitorapi.ResourcesMap, beginning, end time.Time) (monitorapi.Intervals, error) {
return nil, w.notSupportedReason
}

func (w *monitor) EvaluateTestsFromConstructedIntervals(ctx context.Context, finalIntervals monitorapi.Intervals) ([]*junitapi.JUnitTestCase, error) {
if w.notSupportedReason != nil {
return nil, w.notSupportedReason
}
return nil, nil
}

func (w *monitor) WriteContentToStorage(ctx context.Context, storageDir, timeSuffix string, finalIntervals monitorapi.Intervals, finalResourceState monitorapi.ResourcesMap) error {
folderPath := path.Join(storageDir, "adm-upgrade-status")
if err := os.MkdirAll(folderPath, os.ModePerm); err != nil {
return fmt.Errorf("unable to create directory %s: %w", folderPath, err)
}

var errs []error
for when, observed := range w.ocAdmUpgradeStatus {
// format the snapshot time so filenames contain no spaces or colons
outputFilename := fmt.Sprintf("adm-upgrade-status-%s_%s.txt", when.Format("20060102-150405"), timeSuffix)
outputFile := filepath.Join(folderPath, outputFilename)
if err := os.WriteFile(outputFile, []byte(observed.out), 0644); err != nil {
errs = append(errs, fmt.Errorf("failed to write %s: %w", outputFile, err))
}
}
return errors.NewAggregate(errs)
}

func (*monitor) Cleanup(ctx context.Context) error {
return nil
}