Skip to content
Merged
Show file tree
Hide file tree
Changes from 3 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
48 changes: 26 additions & 22 deletions pkg/controllers/controllers.go
Original file line number Diff line number Diff line change
Expand Up @@ -85,9 +85,6 @@ func NewControllers(
informer.NewNodePoolController(kubeClient, cloudProvider, cluster),
informer.NewNodeClaimController(kubeClient, cloudProvider, cluster),
termination.NewController(clock, kubeClient, cloudProvider, terminator.NewTerminator(clock, kubeClient, evictionQueue, recorder), recorder),
metricspod.NewController(kubeClient, cluster),
metricsnodepool.NewController(kubeClient, cloudProvider),
metricsnode.NewController(cluster),
nodepoolreadiness.NewController(kubeClient, cloudProvider),
nodepoolregistrationhealth.NewController(kubeClient, cloudProvider),
nodepoolcounter.NewController(kubeClient, cloudProvider, cluster),
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I'm wondering if it would make sense to include the NodePool Counter controller in this set? I could go either way - since it's just propagating information from cluster state it should be relatively cheap, but the cost does scale with the number of nodepools. It is a "cluster state observability" controller though. Did it show up at all in your performance review?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

We were using a relatively small number of nodepools (~12), and we didn't see a significant performance impact. One thing I want to explore is how exactly the volume of metrics changes as we scale the number of nodes in the cluster

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

It seems fine to include it for the time being, and we can re-evaluate if we see significant performance impact.

Expand All @@ -99,25 +96,32 @@ func NewControllers(
nodeclaimdisruption.NewController(clock, kubeClient, cloudProvider),
nodeclaimhydration.NewController(kubeClient, cloudProvider),
nodehydration.NewController(kubeClient, cloudProvider),
status.NewController[*v1.NodeClaim](
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Are these status controllers only responsible for metrics? Would anything else be missing if we disabled them? (For example, it looks like they also issue transition events ...)

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

They do also emit events for finalizers and status condition changes, but I think that's all they emit

kubeClient,
mgr.GetEventRecorderFor("karpenter"),
status.EmitDeprecatedMetrics,
status.WithHistogramBuckets(prometheus.ExponentialBuckets(0.5, 2, 15)), // 0.5, 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192
status.WithLabels(append(lo.Map(cloudProvider.GetSupportedNodeClasses(), func(obj status.Object, _ int) string { return v1.NodeClassLabelKey(object.GVK(obj).GroupKind()) }), v1.NodePoolLabelKey)...),
),
status.NewController[*v1.NodePool](
kubeClient,
mgr.GetEventRecorderFor("karpenter"),
status.EmitDeprecatedMetrics,
status.WithHistogramBuckets(prometheus.ExponentialBuckets(0.5, 2, 15)), // 0.5, 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192
),
status.NewGenericObjectController[*corev1.Node](
kubeClient,
mgr.GetEventRecorderFor("karpenter"),
status.WithHistogramBuckets(prometheus.ExponentialBuckets(0.5, 2, 15)), // 0.5, 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192
status.WithLabels(append(lo.Map(cloudProvider.GetSupportedNodeClasses(), func(obj status.Object, _ int) string { return v1.NodeClassLabelKey(object.GVK(obj).GroupKind()) }), v1.NodePoolLabelKey, v1.NodeInitializedLabelKey)...),
),
}

if !options.FromContext(ctx).SimplifiedMetrics {
controllers = append(controllers,
metricspod.NewController(kubeClient, cluster),
metricsnodepool.NewController(kubeClient, cloudProvider),
metricsnode.NewController(cluster),
status.NewController[*v1.NodeClaim](
kubeClient,
mgr.GetEventRecorderFor("karpenter"),
status.EmitDeprecatedMetrics,
status.WithHistogramBuckets(prometheus.ExponentialBuckets(0.5, 2, 15)), // 0.5, 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192
status.WithLabels(append(lo.Map(cloudProvider.GetSupportedNodeClasses(), func(obj status.Object, _ int) string { return v1.NodeClassLabelKey(object.GVK(obj).GroupKind()) }), v1.NodePoolLabelKey)...),
),
status.NewController[*v1.NodePool](
kubeClient,
mgr.GetEventRecorderFor("karpenter"),
status.EmitDeprecatedMetrics,
status.WithHistogramBuckets(prometheus.ExponentialBuckets(0.5, 2, 15)), // 0.5, 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192
),
status.NewGenericObjectController[*corev1.Node](
kubeClient,
mgr.GetEventRecorderFor("karpenter"),
status.WithHistogramBuckets(prometheus.ExponentialBuckets(0.5, 2, 15)), // 0.5, 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192
status.WithLabels(append(lo.Map(cloudProvider.GetSupportedNodeClasses(), func(obj status.Object, _ int) string { return v1.NodeClassLabelKey(object.GVK(obj).GroupKind()) }), v1.NodePoolLabelKey, v1.NodeInitializedLabelKey)...)),
)
}

// The cloud provider must define status conditions for the node repair controller to use to detect unhealthy nodes
Expand Down
2 changes: 2 additions & 0 deletions pkg/operator/options/options.go
Original file line number Diff line number Diff line change
Expand Up @@ -85,6 +85,7 @@ type Options struct {
minValuesPolicyRaw string
MinValuesPolicy MinValuesPolicy
FeatureGates FeatureGates
SimplifiedMetrics bool
}

type FlagSet struct {
Expand Down Expand Up @@ -124,6 +125,7 @@ func (o *Options) AddFlags(fs *FlagSet) {
fs.StringVar(&o.preferencePolicyRaw, "preference-policy", env.WithDefaultString("PREFERENCE_POLICY", string(PreferencePolicyRespect)), "How the Karpenter scheduler should treat preferences. Preferences include preferredDuringSchedulingIgnoreDuringExecution node and pod affinities/anti-affinities and ScheduleAnyways topologySpreadConstraints. Can be one of 'Ignore' and 'Respect'")
fs.StringVar(&o.minValuesPolicyRaw, "min-values-policy", env.WithDefaultString("MIN_VALUES_POLICY", string(MinValuesPolicyStrict)), "Min values policy for scheduling. Options include 'Strict' for existing behavior where min values are strictly enforced or 'BestEffort' where Karpenter relaxes min values when it isn't satisfied.")
fs.StringVar(&o.FeatureGates.inputStr, "feature-gates", env.WithDefaultString("FEATURE_GATES", "NodeRepair=false,ReservedCapacity=true,SpotToSpotConsolidation=false,NodeOverlay=false"), "Optional features can be enabled / disabled using feature gates. Current options are: NodeRepair, ReservedCapacity, and SpotToSpotConsolidation.")
fs.BoolVarWithEnv(&o.SimplifiedMetrics, "simplified-metrics", "SIMPLIFIED_METRICS", false, "Optionally disable generic cluster state metrics")
}

func (o *Options) Parse(fs *FlagSet, args ...string) error {
Expand Down
Loading